Signed-off-by: -LAN- <laipz8200@outlook.com> tags/0.15.3
| @@ -1,3 +1,4 @@ | |||
| - deepseek-ai/deepseek-r1 | |||
| - google/gemma-7b | |||
| - google/codegemma-7b | |||
| - google/recurrentgemma-2b | |||
| @@ -0,0 +1,35 @@ | |||
| model: deepseek-ai/deepseek-r1 | |||
| label: | |||
| en_US: deepseek-ai/deepseek-r1 | |||
| model_type: llm | |||
| features: | |||
| - agent-thought | |||
| model_properties: | |||
| mode: chat | |||
| context_size: 128000 | |||
| parameter_rules: | |||
| - name: temperature | |||
| use_template: temperature | |||
| min: 0 | |||
| max: 1 | |||
| default: 0.5 | |||
| - name: top_p | |||
| use_template: top_p | |||
| min: 0 | |||
| max: 1 | |||
| default: 1 | |||
| - name: max_tokens | |||
| use_template: max_tokens | |||
| min: 1 | |||
| max: 1024 | |||
| default: 1024 | |||
| - name: frequency_penalty | |||
| use_template: frequency_penalty | |||
| min: -2 | |||
| max: 2 | |||
| default: 0 | |||
| - name: presence_penalty | |||
| use_template: presence_penalty | |||
| min: -2 | |||
| max: 2 | |||
| default: 0 | |||
| @@ -83,7 +83,7 @@ class NVIDIALargeLanguageModel(OAIAPICompatLargeLanguageModel): | |||
| def _add_custom_parameters(self, credentials: dict, model: str) -> None: | |||
| credentials["mode"] = "chat" | |||
| if self.MODEL_SUFFIX_MAP[model]: | |||
| if self.MODEL_SUFFIX_MAP.get(model): | |||
| credentials["server_url"] = f"https://ai.api.nvidia.com/v1/{self.MODEL_SUFFIX_MAP[model]}" | |||
| credentials.pop("endpoint_url") | |||
| else: | |||