Support new Claude-3.5 Sonnet max token limit (#6335)

This commit is contained in:
Richards Tu 2024-07-18 07:47:06 +08:00 committed by GitHub
parent f55876bcc5
commit 4782fb50c4
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 10 additions and 3 deletions

View File

@@ -27,9 +27,9 @@ parameter_rules:
- name: max_tokens - name: max_tokens
use_template: max_tokens use_template: max_tokens
required: true required: true
default: 4096 default: 8192
min: 1 min: 1
max: 4096 max: 8192
- name: response_format - name: response_format
use_template: response_format use_template: response_format
pricing: pricing:

View File

@@ -113,6 +113,11 @@ class AnthropicLargeLanguageModel(LargeLanguageModel):
if system: if system:
extra_model_kwargs['system'] = system extra_model_kwargs['system'] = system
# Add the new header for claude-3-5-sonnet-20240620 model
headers = {}
if model == "claude-3-5-sonnet-20240620":
headers["anthropic-beta"] = "max-tokens-3-5-sonnet-2024-07-15"
if tools: if tools:
extra_model_kwargs['tools'] = [ extra_model_kwargs['tools'] = [
self._transform_tool_prompt(tool) for tool in tools self._transform_tool_prompt(tool) for tool in tools
@@ -121,6 +126,7 @@ class AnthropicLargeLanguageModel(LargeLanguageModel):
model=model, model=model,
messages=prompt_message_dicts, messages=prompt_message_dicts,
stream=stream, stream=stream,
headers=headers,
**model_parameters, **model_parameters,
**extra_model_kwargs **extra_model_kwargs
) )
@@ -130,6 +136,7 @@ class AnthropicLargeLanguageModel(LargeLanguageModel):
model=model, model=model,
messages=prompt_message_dicts, messages=prompt_message_dicts,
stream=stream, stream=stream,
headers=headers,
**model_parameters, **model_parameters,
**extra_model_kwargs **extra_model_kwargs
) )