From 21664738523f9bae64ec91f075dbdfcd65e10c7e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=91=86=E8=90=8C=E9=97=B7=E6=B2=B9=E7=93=B6?= <253605712@qq.com> Date: Wed, 31 Jan 2024 17:57:17 +0800 Subject: [PATCH] Feat/add spark3.5 llm (#2314) Co-authored-by: lux@njuelectronics.com Co-authored-by: crazywoola <427733928@qq.com> --- .../model_providers/spark/llm/_client.py | 4 +++ .../model_providers/spark/llm/_position.yaml | 4 +++ .../model_providers/spark/llm/spark-3.5.yaml | 33 +++++++++++++++++++ api/core/third_party/spark/spark_llm.py | 4 +++ 4 files changed, 45 insertions(+) create mode 100644 api/core/model_runtime/model_providers/spark/llm/_position.yaml create mode 100644 api/core/model_runtime/model_providers/spark/llm/spark-3.5.yaml diff --git a/api/core/model_runtime/model_providers/spark/llm/_client.py b/api/core/model_runtime/model_providers/spark/llm/_client.py index 37ae40c1d8..9390f4351b 100644 --- a/api/core/model_runtime/model_providers/spark/llm/_client.py +++ b/api/core/model_runtime/model_providers/spark/llm/_client.py @@ -35,6 +35,10 @@ class SparkLLMClient: 'spark-3': { 'version': 'v3.1', 'chat_domain': 'generalv3' + }, + 'spark-3.5': { + 'version': 'v3.5', + 'chat_domain': 'generalv3.5' } } diff --git a/api/core/model_runtime/model_providers/spark/llm/_position.yaml b/api/core/model_runtime/model_providers/spark/llm/_position.yaml new file mode 100644 index 0000000000..64c2db77ce --- /dev/null +++ b/api/core/model_runtime/model_providers/spark/llm/_position.yaml @@ -0,0 +1,4 @@ +- spark-3.5 +- spark-3 +- spark-1.5 +- spark-2 diff --git a/api/core/model_runtime/model_providers/spark/llm/spark-3.5.yaml b/api/core/model_runtime/model_providers/spark/llm/spark-3.5.yaml new file mode 100644 index 0000000000..650eff5d98 --- /dev/null +++ b/api/core/model_runtime/model_providers/spark/llm/spark-3.5.yaml @@ -0,0 +1,33 @@ +model: spark-3.5 +label: + en_US: Spark V3.5 +model_type: llm +model_properties: + mode: chat +parameter_rules: + - name: temperature 
+ use_template: temperature + default: 0.5 + help: + zh_Hans: 核采样阈值。用于决定结果随机性,取值越高随机性越强即相同的问题得到的不同答案的可能性越高。 + en_US: Kernel sampling threshold. Used to determine the randomness of the results. The higher the value, the stronger the randomness, that is, the higher the possibility of getting different answers to the same question. + - name: max_tokens + use_template: max_tokens + default: 2048 + min: 1 + max: 8192 + help: + zh_Hans: 模型回答的tokens的最大长度。 + en_US: The maximum number of tokens in the model response. + - name: top_k + label: + zh_Hans: 取样数量 + en_US: Top k + type: int + default: 4 + min: 1 + max: 6 + help: + zh_Hans: 从 k 个候选中随机选择一个(非等概率)。 + en_US: Randomly select one from k candidates (non-equal probability). + required: false diff --git a/api/core/third_party/spark/spark_llm.py b/api/core/third_party/spark/spark_llm.py index 637c1bc740..ff7f04c396 100644 --- a/api/core/third_party/spark/spark_llm.py +++ b/api/core/third_party/spark/spark_llm.py @@ -35,6 +35,10 @@ class SparkLLMClient: 'spark-v3': { 'version': 'v3.1', 'chat_domain': 'generalv3' + }, + 'spark-v3.5': { + 'version': 'v3.5', + 'chat_domain': 'generalv3.5' } }