Add logic to handle whether a model supports temperature or not.
This commit is contained in:
parent
1c463fca17
commit
e3414890ff
|
|
@@ -5,10 +5,11 @@ All notable changes to this project will be documented in this file.
|
||||||
The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
|
The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
|
||||||
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
|
and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
|
||||||
|
|
||||||
## [Unreleased]
|
## [0.13.1] - 2025-01-31
|
||||||
|
|
||||||
### Added
|
### Added
|
||||||
- WebUI (#61)
|
- WebUI (#61)
|
||||||
|
- Support o3-mini
|
||||||
|
|
||||||
### Changed
|
### Changed
|
||||||
- Convert list input to string to handle create-react-agent tool calls correctly (#66)
|
- Convert list input to string to handle create-react-agent tool calls correctly (#66)
|
||||||
|
|
|
||||||
|
|
@@ -1,3 +1,3 @@
|
||||||
"""Version information."""
|
"""Version information."""
|
||||||
|
|
||||||
__version__ = "0.13.0"
|
__version__ = "0.13.1"
|
||||||
|
|
|
||||||
|
|
@@ -1,6 +1,7 @@
|
||||||
import os
|
import os
|
||||||
from typing import Any, Dict, Optional
|
from typing import Any, Dict, Optional
|
||||||
|
|
||||||
|
from .models_params import models_params
|
||||||
from langchain_anthropic import ChatAnthropic
|
from langchain_anthropic import ChatAnthropic
|
||||||
from langchain_core.language_models import BaseChatModel
|
from langchain_core.language_models import BaseChatModel
|
||||||
from langchain_google_genai import ChatGoogleGenerativeAI
|
from langchain_google_genai import ChatGoogleGenerativeAI
|
||||||
|
|
@@ -135,12 +136,16 @@ def create_llm_client(
|
||||||
is_expert,
|
is_expert,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
# Get model configuration
|
||||||
|
model_config = models_params.get(provider, {}).get(model_name, {})
|
||||||
|
supports_temperature = model_config.get("supports_temperature", False)
|
||||||
|
|
||||||
# Handle temperature settings
|
# Handle temperature settings
|
||||||
if is_expert:
|
if is_expert:
|
||||||
temp_kwargs = {"temperature": 0}
|
temp_kwargs = {"temperature": 0} if supports_temperature else {}
|
||||||
elif temperature is not None:
|
elif temperature is not None and supports_temperature:
|
||||||
temp_kwargs = {"temperature": temperature}
|
temp_kwargs = {"temperature": temperature}
|
||||||
elif provider == "openai-compatible":
|
elif provider == "openai-compatible" and supports_temperature:
|
||||||
temp_kwargs = {"temperature": 0.3}
|
temp_kwargs = {"temperature": 0.3}
|
||||||
else:
|
else:
|
||||||
temp_kwargs = {}
|
temp_kwargs = {}
|
||||||
|
|
|
||||||
|
|
@@ -8,149 +8,149 @@ models_params = {
|
||||||
"openai": {
|
"openai": {
|
||||||
"gpt-3.5-turbo-0125": {
|
"gpt-3.5-turbo-0125": {
|
||||||
"token_limit": 16385,
|
"token_limit": 16385,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5": {
|
"gpt-3.5": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5-turbo": {
|
"gpt-3.5-turbo": {
|
||||||
"token_limit": 16385,
|
"token_limit": 16385,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5-turbo-1106": {
|
"gpt-3.5-turbo-1106": {
|
||||||
"token_limit": 16385,
|
"token_limit": 16385,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5-turbo-instruct": {
|
"gpt-3.5-turbo-instruct": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-0125-preview": {
|
"gpt-4-0125-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-turbo-preview": {
|
"gpt-4-turbo-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-turbo": {
|
"gpt-4-turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-turbo-2024-04-09": {
|
"gpt-4-turbo-2024-04-09": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-1106-preview": {
|
"gpt-4-1106-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-vision-preview": {
|
"gpt-4-vision-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4": {
|
"gpt-4": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-0613": {
|
"gpt-4-0613": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-32k": {
|
"gpt-4-32k": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-32k-0613": {
|
"gpt-4-32k-0613": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4o": {
|
"gpt-4o": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4o-2024-08-06": {
|
"gpt-4o-2024-08-06": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4o-2024-05-13": {
|
"gpt-4o-2024-05-13": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4o-mini": {
|
"gpt-4o-mini": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"o1-preview": {
|
"o1-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": True
|
"supports_temperature": False
|
||||||
},
|
},
|
||||||
"o1-mini": {
|
"o1-mini": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": True
|
"supports_temperature": False
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"azure_openai": {
|
"azure_openai": {
|
||||||
"gpt-3.5-turbo-0125": {
|
"gpt-3.5-turbo-0125": {
|
||||||
"token_limit": 16385,
|
"token_limit": 16385,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5": {
|
"gpt-3.5": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5-turbo": {
|
"gpt-3.5-turbo": {
|
||||||
"token_limit": 16385,
|
"token_limit": 16385,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5-turbo-1106": {
|
"gpt-3.5-turbo-1106": {
|
||||||
"token_limit": 16385,
|
"token_limit": 16385,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-3.5-turbo-instruct": {
|
"gpt-3.5-turbo-instruct": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-0125-preview": {
|
"gpt-4-0125-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-turbo-preview": {
|
"gpt-4-turbo-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-turbo": {
|
"gpt-4-turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-turbo-2024-04-09": {
|
"gpt-4-turbo-2024-04-09": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-1106-preview": {
|
"gpt-4-1106-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-vision-preview": {
|
"gpt-4-vision-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4": {
|
"gpt-4": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-0613": {
|
"gpt-4-0613": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-32k": {
|
"gpt-4-32k": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4-32k-0613": {
|
"gpt-4-32k-0613": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gpt-4o": {
|
"gpt-4o": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
|
|
@@ -166,550 +166,550 @@ models_params = {
|
||||||
},
|
},
|
||||||
"o1-preview": {
|
"o1-preview": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": True
|
"supports_temperature": False
|
||||||
},
|
},
|
||||||
"o1-mini": {
|
"o1-mini": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": True
|
"supports_temperature": False
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"google_genai": {
|
"google_genai": {
|
||||||
"gemini-pro": {
|
"gemini-pro": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemini-1.5-flash-latest": {
|
"gemini-1.5-flash-latest": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemini-1.5-pro-latest": {
|
"gemini-1.5-pro-latest": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"models/embedding-001": {
|
"models/embedding-001": {
|
||||||
"token_limit": 2048,
|
"token_limit": 2048,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"google_vertexai": {
|
"google_vertexai": {
|
||||||
"gemini-1.5-flash": {
|
"gemini-1.5-flash": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemini-1.5-pro": {
|
"gemini-1.5-pro": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemini-1.0-pro": {
|
"gemini-1.0-pro": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"ollama": {
|
"ollama": {
|
||||||
"command-r": {
|
"command-r": {
|
||||||
"token_limit": 12800,
|
"token_limit": 12800,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"codellama": {
|
"codellama": {
|
||||||
"token_limit": 16000,
|
"token_limit": 16000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"dbrx": {
|
"dbrx": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"deepseek-coder:33b": {
|
"deepseek-coder:33b": {
|
||||||
"token_limit": 16000,
|
"token_limit": 16000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"falcon": {
|
"falcon": {
|
||||||
"token_limit": 2048,
|
"token_limit": 2048,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama2": {
|
"llama2": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama2:7b": {
|
"llama2:7b": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama2:13b": {
|
"llama2:13b": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama2:70b": {
|
"llama2:70b": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3": {
|
"llama3": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3:8b": {
|
"llama3:8b": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3:70b": {
|
"llama3:70b": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.1": {
|
"llama3.1": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.1:8b": {
|
"llama3.1:8b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.1:70b": {
|
"llama3.1:70b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"lama3.1:405b": {
|
"lama3.1:405b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.2": {
|
"llama3.2": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.2:1b": {
|
"llama3.2:1b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.2:3b": {
|
"llama3.2:3b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3.3:70b": {
|
"llama3.3:70b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"scrapegraph": {
|
"scrapegraph": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral-small": {
|
"mistral-small": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral-openorca": {
|
"mistral-openorca": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral-large": {
|
"mistral-large": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"grok-1": {
|
"grok-1": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llava": {
|
"llava": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mixtral:8x22b-instruct": {
|
"mixtral:8x22b-instruct": {
|
||||||
"token_limit": 65536,
|
"token_limit": 65536,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"nomic-embed-text": {
|
"nomic-embed-text": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"nous-hermes2:34b": {
|
"nous-hermes2:34b": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"orca-mini": {
|
"orca-mini": {
|
||||||
"token_limit": 2048,
|
"token_limit": 2048,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"phi3:3.8b": {
|
"phi3:3.8b": {
|
||||||
"token_limit": 12800,
|
"token_limit": 12800,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"phi3:14b": {
|
"phi3:14b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:0.5b": {
|
"qwen:0.5b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:1.8b": {
|
"qwen:1.8b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:4b": {
|
"qwen:4b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:14b": {
|
"qwen:14b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:32b": {
|
"qwen:32b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:72b": {
|
"qwen:72b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"qwen:110b": {
|
"qwen:110b": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"stablelm-zephyr": {
|
"stablelm-zephyr": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"wizardlm2:8x22b": {
|
"wizardlm2:8x22b": {
|
||||||
"token_limit": 65536,
|
"token_limit": 65536,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral": {
|
"mistral": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemma2": {
|
"gemma2": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemma2:9b": {
|
"gemma2:9b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemma2:27b": {
|
"gemma2:27b": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
# embedding models
|
# embedding models
|
||||||
"shaw/dmeta-embedding-zh-small-q4": {
|
"shaw/dmeta-embedding-zh-small-q4": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"shaw/dmeta-embedding-zh-q4": {
|
"shaw/dmeta-embedding-zh-q4": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"chevalblanc/acge_text_embedding": {
|
"chevalblanc/acge_text_embedding": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"martcreation/dmeta-embedding-zh": {
|
"martcreation/dmeta-embedding-zh": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"snowflake-arctic-embed": {
|
"snowflake-arctic-embed": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mxbai-embed-large": {
|
"mxbai-embed-large": {
|
||||||
"token_limit": 512,
|
"token_limit": 512,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"oneapi": {
|
"oneapi": {
|
||||||
"qwen-turbo": {
|
"qwen-turbo": {
|
||||||
"token_limit": 6000,
|
"token_limit": 6000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"nvidia": {
|
"nvidia": {
|
||||||
"meta/llama3-70b-instruct": {
|
"meta/llama3-70b-instruct": {
|
||||||
"token_limit": 419,
|
"token_limit": 419,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta/llama3-8b-instruct": {
|
"meta/llama3-8b-instruct": {
|
||||||
"token_limit": 419,
|
"token_limit": 419,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"nemotron-4-340b-instruct": {
|
"nemotron-4-340b-instruct": {
|
||||||
"token_limit": 1024,
|
"token_limit": 1024,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"databricks/dbrx-instruct": {
|
"databricks/dbrx-instruct": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"google/codegemma-7b": {
|
"google/codegemma-7b": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"google/gemma-2b": {
|
"google/gemma-2b": {
|
||||||
"token_limit": 2048,
|
"token_limit": 2048,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"google/gemma-7b": {
|
"google/gemma-7b": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"google/recurrentgemma-2b": {
|
"google/recurrentgemma-2b": {
|
||||||
"token_limit": 2048,
|
"token_limit": 2048,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta/codellama-70b": {
|
"meta/codellama-70b": {
|
||||||
"token_limit": 16384,
|
"token_limit": 16384,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta/llama2-70b": {
|
"meta/llama2-70b": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"microsoft/phi-3-mini-128k-instruct": {
|
"microsoft/phi-3-mini-128k-instruct": {
|
||||||
"token_limit": 122880,
|
"token_limit": 122880,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistralai/mistral-7b-instruct-v0.2": {
|
"mistralai/mistral-7b-instruct-v0.2": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistralai/mistral-large": {
|
"mistralai/mistral-large": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistralai/mixtral-8x22b-instruct-v0.1": {
|
"mistralai/mixtral-8x22b-instruct-v0.1": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistralai/mixtral-8x7b-instruct-v0.1": {
|
"mistralai/mixtral-8x7b-instruct-v0.1": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"snowflake/arctic": {
|
"snowflake/arctic": {
|
||||||
"token_limit": 16384,
|
"token_limit": 16384,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"groq": {
|
"groq": {
|
||||||
"llama3-8b-8192": {
|
"llama3-8b-8192": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"llama3-70b-8192": {
|
"llama3-70b-8192": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mixtral-8x7b-32768": {
|
"mixtral-8x7b-32768": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"gemma-7b-it": {
|
"gemma-7b-it": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-haiku-20240307'": {
|
"claude-3-haiku-20240307'": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"toghetherai": {
|
"toghetherai": {
|
||||||
"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
|
"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
|
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistralai/Mixtral-8x22B-Instruct-v0.1": {
|
"mistralai/Mixtral-8x22B-Instruct-v0.1": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"stabilityai/stable-diffusion-xl-base-1.0": {
|
"stabilityai/stable-diffusion-xl-base-1.0": {
|
||||||
"token_limit": 2048,
|
"token_limit": 2048,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": {
|
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"NousResearch/Hermes-3-Llama-3.1-405B-Turbo": {
|
"NousResearch/Hermes-3-Llama-3.1-405B-Turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"Gryphe/MythoMax-L2-13b-Lite": {
|
"Gryphe/MythoMax-L2-13b-Lite": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"Salesforce/Llama-Rank-V1": {
|
"Salesforce/Llama-Rank-V1": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta-llama/Meta-Llama-Guard-3-8B": {
|
"meta-llama/Meta-Llama-Guard-3-8B": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta-llama/Meta-Llama-3-70B-Instruct-Turbo": {
|
"meta-llama/Meta-Llama-3-70B-Instruct-Turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta-llama/Llama-3-8b-chat-hf": {
|
"meta-llama/Llama-3-8b-chat-hf": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta-llama/Llama-3-70b-chat-hf": {
|
"meta-llama/Llama-3-70b-chat-hf": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"Qwen/Qwen2-72B-Instruct": {
|
"Qwen/Qwen2-72B-Instruct": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"google/gemma-2-27b-it": {
|
"google/gemma-2-27b-it": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"anthropic": {
|
"anthropic": {
|
||||||
"claude_instant": {
|
"claude_instant": {
|
||||||
"token_limit": 100000,
|
"token_limit": 100000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude2": {
|
"claude2": {
|
||||||
"token_limit": 9000,
|
"token_limit": 9000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude2.1": {
|
"claude2.1": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude3": {
|
"claude3": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude3.5": {
|
"claude3.5": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-opus-20240229": {
|
"claude-3-opus-20240229": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-sonnet-20240229": {
|
"claude-3-sonnet-20240229": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-haiku-20240307": {
|
"claude-3-haiku-20240307": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-5-sonnet-20240620": {
|
"claude-3-5-sonnet-20240620": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-5-sonnet-20241022": {
|
"claude-3-5-sonnet-20241022": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-5-haiku-latest": {
|
"claude-3-5-haiku-latest": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"bedrock": {
|
"bedrock": {
|
||||||
"anthropic.claude-3-haiku-20240307-v1:0": {
|
"anthropic.claude-3-haiku-20240307-v1:0": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"anthropic.claude-3-sonnet-20240229-v1:0": {
|
"anthropic.claude-3-sonnet-20240229-v1:0": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"anthropic.claude-3-opus-20240229-v1:0": {
|
"anthropic.claude-3-opus-20240229-v1:0": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"anthropic.claude-3-5-sonnet-20240620-v1:0": {
|
"anthropic.claude-3-5-sonnet-20240620-v1:0": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"claude-3-5-haiku-latest": {
|
"claude-3-5-haiku-latest": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"anthropic.claude-v2:1": {
|
"anthropic.claude-v2:1": {
|
||||||
"token_limit": 200000,
|
"token_limit": 200000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"anthropic.claude-v2": {
|
"anthropic.claude-v2": {
|
||||||
"token_limit": 100000,
|
"token_limit": 100000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"anthropic.claude-instant-v1": {
|
"anthropic.claude-instant-v1": {
|
||||||
"token_limit": 100000,
|
"token_limit": 100000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta.llama3-8b-instruct-v1:0": {
|
"meta.llama3-8b-instruct-v1:0": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta.llama3-70b-instruct-v1:0": {
|
"meta.llama3-70b-instruct-v1:0": {
|
||||||
"token_limit": 8192,
|
"token_limit": 8192,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta.llama2-13b-chat-v1": {
|
"meta.llama2-13b-chat-v1": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"meta.llama2-70b-chat-v1": {
|
"meta.llama2-70b-chat-v1": {
|
||||||
"token_limit": 4096,
|
"token_limit": 4096,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral.mistral-7b-instruct-v0:2": {
|
"mistral.mistral-7b-instruct-v0:2": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral.mixtral-8x7b-instruct-v0:1": {
|
"mistral.mixtral-8x7b-instruct-v0:1": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral.mistral-large-2402-v1:0": {
|
"mistral.mistral-large-2402-v1:0": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"mistral.mistral-small-2402-v1:0": {
|
"mistral.mistral-small-2402-v1:0": {
|
||||||
"token_limit": 32768,
|
"token_limit": 32768,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"amazon.titan-embed-text-v1": {
|
"amazon.titan-embed-text-v1": {
|
||||||
"token_limit": 8000,
|
"token_limit": 8000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"amazon.titan-embed-text-v2:0": {
|
"amazon.titan-embed-text-v2:0": {
|
||||||
"token_limit": 8000,
|
"token_limit": 8000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"cohere.embed-english-v3": {
|
"cohere.embed-english-v3": {
|
||||||
"token_limit": 512,
|
"token_limit": 512,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"cohere.embed-multilingual-v3": {
|
"cohere.embed-multilingual-v3": {
|
||||||
"token_limit": 512,
|
"token_limit": 512,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"mistralai": {
|
"mistralai": {
|
||||||
"mistral-large-latest": {
|
"mistral-large-latest": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"open-mistral-nemo": {
|
"open-mistral-nemo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
},
|
},
|
||||||
"codestral-latest": {
|
"codestral-latest": {
|
||||||
"token_limit": 32000,
|
"token_limit": 32000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"togetherai": {
|
"togetherai": {
|
||||||
"Meta-Llama-3.1-70B-Instruct-Turbo": {
|
"Meta-Llama-3.1-70B-Instruct-Turbo": {
|
||||||
"token_limit": 128000,
|
"token_limit": 128000,
|
||||||
"supports_temperature": False
|
"supports_temperature": True
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue