Upgrade oracle models (#13174)

Co-authored-by: engchina <atjapan2015@gmail.com>
2025-08-16 20:15:58 +08:00 · 2025-02-06 13:24:27 +08:00 · 2025-02-06 13:24:27 +08:00 · 40dd63ecef
commit 40dd63ecef
parent 6d66d6da15
8 changed files with 164 additions and 6 deletions
--- a/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-08-2024.yaml
+++ b/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-08-2024.yaml
@ -0,0 +1,52 @@
 model: cohere.command-r-08-2024  # LLM definition for the oci provider; the same id is registered in llm.py's _supported_models
 label:
  en_US: cohere.command-r-08-2024 v1.7  # English (en_US) label for this model
 model_type: llm
 features:  # capabilities listed for this model
  - multi-tool-call
  - agent-thought
  - stream-tool-call  # NOTE(review): llm.py's _supported_models entry for this id sets "stream_tool_call": False — confirm which is intended
 model_properties:
  mode: chat
  context_size: 128000  # presumably measured in tokens — TODO confirm
 parameter_rules:  # tunable request parameters with their defaults and bounds
  - name: temperature
    use_template: temperature  # presumably inherits unspecified fields from a shared `temperature` template — confirm against the runtime schema
    default: 1  # the default equals the maximum below
    max: 1.0
  - name: topP
    use_template: top_p
    default: 0.75
    min: 0
    max: 1
  - name: topK  # no use_template here, so label, type and help are spelled out inline
    label:
      zh_Hans: 取样数量
      en_US: Top k
    type: int
    help:
      zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
      en_US: Only sample from the top K options for each subsequent token.
    required: false
    default: 0
    min: 0
    max: 500
  - name: presencePenalty
    use_template: presence_penalty
    min: 0  # only non-negative penalties are allowed (0 to 1)
    max: 1
    default: 0
  - name: frequencyPenalty
    use_template: frequency_penalty
    min: 0  # only non-negative penalties are allowed (0 to 1)
    max: 1
    default: 0
  - name: maxTokens
    use_template: max_tokens
    default: 600
    max: 4000
 pricing:
  input: '0.0009'
  output: '0.0009'  # same rate as input
  unit: '0.0001'  # presumably a scaling factor applied to the input/output prices — TODO confirm
  currency: USD
--- a/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-16k.yaml
+++ b/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-16k.yaml
@ -50,3 +50,4 @@ pricing:
  output: '0.004'
  unit: '0.0001'
  currency: USD
 deprecated: true
--- a/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-plus-08-2024.yaml
+++ b/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-plus-08-2024.yaml
@ -0,0 +1,52 @@
 model: cohere.command-r-plus-08-2024  # LLM definition for the oci provider; the same id is registered in llm.py's _supported_models
 label:
  en_US: cohere.command-r-plus-08-2024 v1.6  # English (en_US) label for this model
 model_type: llm
 features:  # capabilities listed for this model
  - multi-tool-call
  - agent-thought
  - stream-tool-call
 model_properties:
  mode: chat
  context_size: 128000  # presumably measured in tokens — TODO confirm
 parameter_rules:  # tunable request parameters with their defaults and bounds
  - name: temperature
    use_template: temperature  # presumably inherits unspecified fields from a shared `temperature` template — confirm against the runtime schema
    default: 1  # the default equals the maximum below
    max: 1.0
  - name: topP
    use_template: top_p
    default: 0.75
    min: 0
    max: 1
  - name: topK  # no use_template here, so label, type and help are spelled out inline
    label:
      zh_Hans: 取样数量
      en_US: Top k
    type: int
    help:
      zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
      en_US: Only sample from the top K options for each subsequent token.
    required: false
    default: 0
    min: 0
    max: 500
  - name: presencePenalty
    use_template: presence_penalty
    min: 0  # only non-negative penalties are allowed (0 to 1)
    max: 1
    default: 0
  - name: frequencyPenalty
    use_template: frequency_penalty
    min: 0  # only non-negative penalties are allowed (0 to 1)
    max: 1
    default: 0
  - name: maxTokens
    use_template: max_tokens
    default: 600
    max: 4000
 pricing:
  input: '0.0156'
  output: '0.0156'  # same rate as input
  unit: '0.0001'  # presumably a scaling factor applied to the input/output prices — TODO confirm
  currency: USD
--- a/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-plus.yaml
+++ b/api/core/model_runtime/model_providers/oci/llm/cohere.command-r-plus.yaml
@ -50,3 +50,4 @@ pricing:
  output: '0.0219'
  unit: '0.0001'
  currency: USD
 deprecated: true
--- a/api/core/model_runtime/model_providers/oci/llm/llm.py
+++ b/api/core/model_runtime/model_providers/oci/llm/llm.py
@ -33,7 +33,7 @@ logger = logging.getLogger(__name__)
 request_template = {
    "compartmentId": "",
-    "servingMode": {"modelId": "cohere.command-r-plus", "servingType": "ON_DEMAND"},
+    "servingMode": {"modelId": "cohere.command-r-plus-08-2024", "servingType": "ON_DEMAND"},
    "chatRequest": {
        "apiFormat": "COHERE",
        # "preambleOverride": "You are a helpful assistant.",
@ -60,19 +60,19 @@ oci_config_template = {
 class OCILargeLanguageModel(LargeLanguageModel):
    # https://docs.oracle.com/en-us/iaas/Content/generative-ai/pretrained-models.htm
    _supported_models = {
-        "meta.llama-3-70b-instruct": {
+        "meta.llama-3.1-70b-instruct": {
            "system": True,
            "multimodal": False,
            "tool_call": False,
            "stream_tool_call": False,
        },
-        "cohere.command-r-16k": {
+        "cohere.command-r-08-2024": {
            "system": True,
            "multimodal": False,
            "tool_call": True,
            "stream_tool_call": False,
        },
-        "cohere.command-r-plus": {
+        "cohere.command-r-plus-08-2024": {
            "system": True,
            "multimodal": False,
            "tool_call": True,
--- a/api/core/model_runtime/model_providers/oci/llm/meta.llama-3-70b-instruct.yaml
+++ b/api/core/model_runtime/model_providers/oci/llm/meta.llama-3-70b-instruct.yaml
@ -49,3 +49,4 @@ pricing:
  output: '0.015'
  unit: '0.0001'
  currency: USD
 deprecated: true
--- a/api/core/model_runtime/model_providers/oci/llm/meta.llama-3.1-70b-instruct.yaml
+++ b/api/core/model_runtime/model_providers/oci/llm/meta.llama-3.1-70b-instruct.yaml
@ -0,0 +1,51 @@
 model: meta.llama-3.1-70b-instruct  # LLM definition for the oci provider; the same id is registered in llm.py's _supported_models
 label:  # the label is the raw model id in both locales
  zh_Hans: meta.llama-3.1-70b-instruct
  en_US: meta.llama-3.1-70b-instruct
 model_type: llm
 features:  # no tool-call features listed; llm.py's _supported_models entry for this id sets "tool_call": False
  - agent-thought
 model_properties:
  mode: chat
  context_size: 131072  # 128 * 1024; presumably measured in tokens — TODO confirm
 parameter_rules:  # tunable request parameters with their defaults and bounds
  - name: temperature
    use_template: temperature  # presumably inherits unspecified fields from a shared `temperature` template — confirm against the runtime schema
    default: 1
    max: 2.0
  - name: topP
    use_template: top_p
    default: 0.75
    min: 0
    max: 1
  - name: topK  # no use_template here, so label, type and help are spelled out inline
    label:
      zh_Hans: 取样数量
      en_US: Top k
    type: int
    help:
      zh_Hans: 仅从每个后续标记的前 K 个选项中采样。
      en_US: Only sample from the top K options for each subsequent token.
    required: false
    default: 0
    min: 0
    max: 500
  - name: presencePenalty
    use_template: presence_penalty
    min: -2  # negative penalties are allowed (-2 to 2)
    max: 2
    default: 0
  - name: frequencyPenalty
    use_template: frequency_penalty
    min: -2  # negative penalties are allowed (-2 to 2)
    max: 2
    default: 0
  - name: maxTokens
    use_template: max_tokens
    default: 600
    max: 4000
 pricing:
  input: '0.0075'
  output: '0.0075'  # same rate as input
  unit: '0.0001'  # presumably a scaling factor applied to the input/output prices — TODO confirm
  currency: USD
--- a/api/core/model_runtime/model_providers/oci/oci.py
+++ b/api/core/model_runtime/model_providers/oci/oci.py
@ -19,8 +19,8 @@ class OCIGENAIProvider(ModelProvider):
        try:
            model_instance = self.get_model_instance(ModelType.LLM)
-            # Use `cohere.command-r-plus` model for validate,
+            # Use `cohere.command-r-plus-08-2024` model for validate,
-            model_instance.validate_credentials(model="cohere.command-r-plus", credentials=credentials)
+            model_instance.validate_credentials(model="cohere.command-r-plus-08-2024", credentials=credentials)
        except CredentialsValidateFailedError as ex:
            raise ex
        except Exception as ex: