From 3242cf53846e35ded6363ab4a85d2c8adcad156a Mon Sep 17 00:00:00 2001
From: takatost
Date: Tue, 6 Feb 2024 13:54:38 +0800
Subject: [PATCH] fix: moonshot context size error (#2406)

---
 api/core/model_runtime/model_providers/_position.yaml  |  1 +
 .../model_providers/moonshot/llm/moonshot-v1-128k.yaml | 10 +++-------
 .../model_providers/moonshot/llm/moonshot-v1-32k.yaml  | 10 +++-------
 .../model_providers/moonshot/llm/moonshot-v1-8k.yaml   |  8 ++------
 4 files changed, 9 insertions(+), 20 deletions(-)

diff --git a/api/core/model_runtime/model_providers/_position.yaml b/api/core/model_runtime/model_providers/_position.yaml
index 9f7fe4c4f4..b2c6518395 100644
--- a/api/core/model_runtime/model_providers/_position.yaml
+++ b/api/core/model_runtime/model_providers/_position.yaml
@@ -14,6 +14,7 @@
 - minimax
 - tongyi
 - wenxin
+- moonshot
 - jina
 - chatglm
 - xinference
diff --git a/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-128k.yaml b/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-128k.yaml
index fe197b3cfd..28bfaed98a 100644
--- a/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-128k.yaml
+++ b/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-128k.yaml
@@ -7,21 +7,17 @@ features:
   - agent-thought
 model_properties:
   mode: chat
-  context_size: 4096
+  context_size: 128000
 parameter_rules:
   - name: temperature
     use_template: temperature
   - name: top_p
     use_template: top_p
-  - name: presence_penalty
-    use_template: presence_penalty
-  - name: frequency_penalty
-    use_template: frequency_penalty
   - name: max_tokens
     use_template: max_tokens
-    default: 512
+    default: 1024
     min: 1
-    max: 4096
+    max: 128000
 pricing:
   input: '0.06'
   output: '0.06'
diff --git a/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-32k.yaml b/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-32k.yaml
index bc12ea5526..0df1a837f9 100644
--- a/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-32k.yaml
+++ b/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-32k.yaml
@@ -7,21 +7,17 @@ features:
   - agent-thought
 model_properties:
   mode: chat
-  context_size: 4096
+  context_size: 32000
 parameter_rules:
   - name: temperature
     use_template: temperature
   - name: top_p
     use_template: top_p
-  - name: presence_penalty
-    use_template: presence_penalty
-  - name: frequency_penalty
-    use_template: frequency_penalty
   - name: max_tokens
     use_template: max_tokens
-    default: 512
+    default: 1024
     min: 1
-    max: 4096
+    max: 32000
 pricing:
   input: '0.024'
   output: '0.024'
diff --git a/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-8k.yaml b/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-8k.yaml
index 5643a72195..e4e0a0f069 100644
--- a/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-8k.yaml
+++ b/api/core/model_runtime/model_providers/moonshot/llm/moonshot-v1-8k.yaml
@@ -7,21 +7,17 @@ features:
   - agent-thought
 model_properties:
   mode: chat
-  context_size: 4096
+  context_size: 8192
 parameter_rules:
   - name: temperature
     use_template: temperature
   - name: top_p
     use_template: top_p
-  - name: presence_penalty
-    use_template: presence_penalty
-  - name: frequency_penalty
-    use_template: frequency_penalty
   - name: max_tokens
     use_template: max_tokens
     default: 512
     min: 1
-    max: 4096
+    max: 8192
 pricing:
   input: '0.012'
   output: '0.012'