From 00458a31d58624d51ea5c7dff255902ecd6ff865 Mon Sep 17 00:00:00 2001
From: Riddhimaan-Senapati <114703025+Riddhimaan-Senapati@users.noreply.github.com>
Date: Wed, 5 Feb 2025 08:59:18 -0500
Subject: [PATCH] feat: added deepseek r1 and v3 to siliconflow (#13238)

---
Note (text between the "---" line and the diff is not part of the commit):
Both files are newly created. deepseek-r1.yaml declares only the max_tokens
parameter rule; deepseek-v3.yaml additionally declares the tool-call features
and the temperature, top_p, top_k, frequency_penalty and response_format rules.
Line breaks and YAML indentation were restored from a whitespace-collapsed
copy; the added-line counts match the hunk headers (21 and 53).

 .../siliconflow/llm/deepseek-r1.yaml          | 21 ++++++++
 .../siliconflow/llm/deepseek-v3.yaml          | 53 +++++++++++++++++++
 2 files changed, 74 insertions(+)
 create mode 100644 api/core/model_runtime/model_providers/siliconflow/llm/deepseek-r1.yaml
 create mode 100644 api/core/model_runtime/model_providers/siliconflow/llm/deepseek-v3.yaml

diff --git a/api/core/model_runtime/model_providers/siliconflow/llm/deepseek-r1.yaml b/api/core/model_runtime/model_providers/siliconflow/llm/deepseek-r1.yaml
new file mode 100644
index 00000000000000..44c6a9d55e4913
--- /dev/null
+++ b/api/core/model_runtime/model_providers/siliconflow/llm/deepseek-r1.yaml
@@ -0,0 +1,21 @@
+model: deepseek-ai/DeepSeek-R1
+label:
+  zh_Hans: deepseek-ai/DeepSeek-R1
+  en_US: deepseek-ai/DeepSeek-R1
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 64000
+parameter_rules:
+  - name: max_tokens
+    use_template: max_tokens
+    min: 1
+    max: 8192
+    default: 4096
+pricing:
+  input: "4"
+  output: "16"
+  unit: "0.000001"
+  currency: RMB
diff --git a/api/core/model_runtime/model_providers/siliconflow/llm/deepseek-v3.yaml b/api/core/model_runtime/model_providers/siliconflow/llm/deepseek-v3.yaml
new file mode 100644
index 00000000000000..ed1a5f00992b7c
--- /dev/null
+++ b/api/core/model_runtime/model_providers/siliconflow/llm/deepseek-v3.yaml
@@ -0,0 +1,53 @@
+model: deepseek-ai/DeepSeek-V3
+label:
+  en_US: deepseek-ai/DeepSeek-V3
+model_type: llm
+features:
+  - agent-thought
+  - tool-call
+  - stream-tool-call
+model_properties:
+  mode: chat
+  context_size: 64000
+parameter_rules:
+  - name: temperature
+    use_template: temperature
+  - name: max_tokens
+    use_template: max_tokens
+    type: int
+    default: 512
+    min: 1
+    max: 4096
+    help:
+      zh_Hans: 指定生成结果长度的上限。如果生成结果截断,可以调大该参数。
+      en_US: Specifies the upper limit on the length of generated results. If the generated results are truncated, you can increase this parameter.
+  - name: top_p
+    use_template: top_p
+  - name: top_k
+    label:
+      zh_Hans: 取样数量
+      en_US: Top k
+    type: int
+    help:
+      zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
+      en_US: Only sample from the top K options for each subsequent token.
+    required: false
+  - name: frequency_penalty
+    use_template: frequency_penalty
+  - name: response_format
+    label:
+      zh_Hans: 回复格式
+      en_US: Response Format
+    type: string
+    help:
+      zh_Hans: 指定模型必须输出的格式
+      en_US: specifying the format that the model must output
+    required: false
+    options:
+      - text
+      - json_object
+pricing:
+  input: "1"
+  output: "2"
+  unit: "0.000001"
+  currency: RMB