From 820a0ded9c8b8a09295849fe94bb13165fade236 Mon Sep 17 00:00:00 2001 From: Zachary Loeber Date: Sun, 3 Aug 2025 12:54:00 -0500 Subject: [PATCH 1/4] feature: add ollama provider based partially on json output generated in https://ollama-models.zwz.workers.dev/ --- internal/providers/configs/ollama.json | 2123 ++++++++++++++++++++++++ internal/providers/providers.go | 7 + 2 files changed, 2130 insertions(+) create mode 100644 internal/providers/configs/ollama.json diff --git a/internal/providers/configs/ollama.json b/internal/providers/configs/ollama.json new file mode 100644 index 00000000..b79fe6ef --- /dev/null +++ b/internal/providers/configs/ollama.json @@ -0,0 +1,2123 @@ +{ + "name": "Ollama", + "id": "ollama", + "type": "openai", + "api_key": "ollama", + "api_endpoint": "$OLLAMA_API_ENDPOINT", + "default_large_model_id": "deepseek-r1", + "default_small_model_id": "llama3", + "models": [ + { + "id": "deepseek-r1", + "name": "deepseek-r1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "gemma3n", + "name": "gemma3n", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "gemma3", + "name": "gemma3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen3", + "name": "qwen3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": 
"qwen2.5vl", + "name": "qwen2.5vl", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": true + }, + { + "id": "llama3.1", + "name": "llama3.1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "nomic-embed-text", + "name": "nomic-embed-text", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3.2", + "name": "llama3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "mistral", + "name": "mistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2.5", + "name": "qwen2.5", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3", + "name": "llama3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llava", + "name": "llava", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + 
"cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "phi3", + "name": "phi3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "gemma2", + "name": "gemma2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2.5-coder", + "name": "qwen2.5-coder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "gemma", + "name": "gemma", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen", + "name": "qwen", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mxbai-embed-large", + "name": "mxbai-embed-large", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2", + "name": "qwen2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, 
+ "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama2", + "name": "llama2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi4", + "name": "phi4", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "minicpm-v", + "name": "minicpm-v", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 1800, + "default_max_tokens": 1800, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "codellama", + "name": "codellama", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 100000, + "default_max_tokens": 100000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "tinyllama", + "name": "tinyllama", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3.3", + "name": "llama3.3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "llama3.2-vision", + "name": "llama3.2-vision", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "dolphin3", + "name":
"dolphin3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-nemo", + "name": "mistral-nemo", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "olmo2", + "name": "olmo2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "deepseek-v3", + "name": "deepseek-v3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "bge-m3", + "name": "bge-m3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "qwq", + "name": "qwq", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-small", + "name": "mistral-small", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llava-llama3", + "name": "llava-llama3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + 
"cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "smollm2", + "name": "smollm2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama2-uncensored", + "name": "llama2-uncensored", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mixtral", + "name": "mixtral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "starcoder2", + "name": "starcoder2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 16384, + "default_max_tokens": 16384, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "all-minilm", + "name": "all-minilm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "deepseek-coder-v2", + "name": "deepseek-coder-v2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "deepseek-coder", + "name": "deepseek-coder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 16000, + 
"default_max_tokens": 16000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "snowflake-arctic-embed", + "name": "snowflake-arctic-embed", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "codegemma", + "name": "codegemma", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi", + "name": "phi", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "dolphin-mixtral", + "name": "dolphin-mixtral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "openthinker", + "name": "openthinker", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32768, + "default_max_tokens": 32768, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama4", + "name": "llama4", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 10000000, + "default_max_tokens": 10000000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "orca-mini", + "name": "orca-mini", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + 
"supports_attachments": false + }, + { + "id": "wizardlm2", + "name": "wizardlm2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "smollm", + "name": "smollm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "dolphin-mistral", + "name": "dolphin-mistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "codestral", + "name": "codestral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "dolphin-llama3", + "name": "dolphin-llama3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r", + "name": "command-r", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "hermes3", + "name": "hermes3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi3.5", + "name": "phi3.5", + 
"cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "yi", + "name": "yi", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "zephyr", + "name": "zephyr", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.3", + "name": "granite3.3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi4-mini", + "name": "phi4-mini", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "moondream", + "name": "moondream", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "granite-code", + "name": "granite-code", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "wizard-vicuna-uncensored", + "name": "wizard-vicuna-uncensored", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + 
"cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "magistral", + "name": "magistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 40000, + "default_max_tokens": 40000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "devstral", + "name": "devstral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi4-reasoning", + "name": "phi4-reasoning", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "starcoder", + "name": "starcoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "cogito", + "name": "cogito", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-small3.1", + "name": "mistral-small3.1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "deepcoder", + "name": "deepcoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + 
"default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "vicuna", + "name": "vicuna", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "openchat", + "name": "openchat", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-openorca", + "name": "mistral-openorca", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "codegeex4", + "name": "codegeex4", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "deepseek-llm", + "name": "deepseek-llm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "deepseek-v2", + "name": "deepseek-v2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "openhermes", + "name": "openhermes", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": 
false + }, + { + "id": "granite3.2-vision", + "name": "granite3.2-vision", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "codeqwen", + "name": "codeqwen", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 64000, + "default_max_tokens": 64000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "mistral-large", + "name": "mistral-large", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama2-chinese", + "name": "llama2-chinese", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "aya", + "name": "aya", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "tinydolphin", + "name": "tinydolphin", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "glm4", + "name": "glm4", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2-math", + "name": "qwen2-math", +
"cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "stable-code", + "name": "stable-code", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 16384, + "default_max_tokens": 16384, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "nous-hermes2", + "name": "nous-hermes2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "wizardcoder", + "name": "wizardcoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r-plus", + "name": "command-r-plus", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "bakllava", + "name": "bakllava", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "neural-chat", + "name": "neural-chat", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.2", + "name": "granite3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + 
"cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "stablelm2", + "name": "stablelm2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "bge-large", + "name": "bge-large", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "sqlcoder", + "name": "sqlcoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3-chatqa", + "name": "llama3-chatqa", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "snowflake-arctic-embed2", + "name": "snowflake-arctic-embed2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "reflection", + "name": "reflection", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "wizard-math", + "name": "wizard-math", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + 
"context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llava-phi3", + "name": "llava-phi3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "nous-hermes", + "name": "nous-hermes", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.1-dense", + "name": "granite3.1-dense", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3-dense", + "name": "granite3-dense", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3-gradient", + "name": "llama3-gradient", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "dbrx", + "name": "dbrx", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32768, + "default_max_tokens": 32768, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "exaone3.5", + "name": "exaone3.5", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, +
"can_reason": true, + "supports_attachments": false + }, + { + "id": "samantha-mistral", + "name": "samantha-mistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "yi-coder", + "name": "yi-coder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "falcon", + "name": "falcon", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "dolphincoder", + "name": "dolphincoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "nemotron-mini", + "name": "nemotron-mini", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "starling-lm", + "name": "starling-lm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "deepscaler", + "name": "deepscaler", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": false, + "supports_attachments": false + }, + { + "id": 
"phind-codellama", + "name": "phind-codellama", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 16000, + "default_max_tokens": 16000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "solar", + "name": "solar", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "xwinlm", + "name": "xwinlm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "internlm2", + "name": "internlm2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "athene-v2", + "name": "athene-v2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "opencoder", + "name": "opencoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "dolphin-phi", + "name": "dolphin-phi", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "nemotron", + "name": "nemotron", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + 
"cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "yarn-llama2", + "name": "yarn-llama2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "exaone-deep", + "name": "exaone-deep", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3-groq-tool-use", + "name": "llama3-groq-tool-use", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "wizardlm", + "name": "wizardlm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-small3.2", + "name": "mistral-small3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 24000, + "default_max_tokens": 24000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "paraphrase-multilingual", + "name": "paraphrase-multilingual", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "falcon3", + "name": "falcon3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + 
"cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "wizardlm-uncensored", + "name": "wizardlm-uncensored", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "aya-expanse", + "name": "aya-expanse", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "orca2", + "name": "orca2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "smallthinker", + "name": "smallthinker", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama-guard3", + "name": "llama-guard3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite-embedding", + "name": "granite-embedding", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 512, + "default_max_tokens": 512, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "medllama2", + "name": "medllama2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 
4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "nous-hermes2-mixtral", + "name": "nous-hermes2-mixtral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "stable-beluga", + "name": "stable-beluga", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "meditron", + "name": "meditron", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3-moe", + "name": "granite3-moe", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "r1-1776", + "name": "r1-1776", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.1-moe", + "name": "granite3.1-moe", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "deepseek-v2.5", + "name": "deepseek-v2.5", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + 
"can_reason": true, + "supports_attachments": false + }, + { + "id": "reader-lm", + "name": "reader-lm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama-pro", + "name": "llama-pro", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "yarn-mistral", + "name": "yarn-mistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "shieldgemma", + "name": "shieldgemma", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "nexusraven", + "name": "nexusraven", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r7b", + "name": "command-r7b", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mathstral", + "name": "mathstral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": 
"everythinglm", + "name": "everythinglm", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 16384, + "default_max_tokens": 16384, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "codeup", + "name": "codeup", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "marco-o1", + "name": "marco-o1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "stablelm-zephyr", + "name": "stablelm-zephyr", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "tulu3", + "name": "tulu3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "solar-pro", + "name": "solar-pro", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "duckdb-nsql", + "name": "duckdb-nsql", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi4-mini-reasoning", + "name": "phi4-mini-reasoning", + "cost_per_1m_in": 0, + 
"cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "falcon2", + "name": "falcon2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "magicoder", + "name": "magicoder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistrallite", + "name": "mistrallite", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "codebooga", + "name": "codebooga", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "bespoke-minicheck", + "name": "bespoke-minicheck", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "wizard-vicuna", + "name": "wizard-vicuna", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "nuextract", + "name": "nuextract", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + 
"cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3-guardian", + "name": "granite3-guardian", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "megadolphin", + "name": "megadolphin", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "notux", + "name": "notux", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "open-orca-platypus2", + "name": "open-orca-platypus2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "notus", + "name": "notus", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-a", + "name": "command-a", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 256000, + "default_max_tokens": 256000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "goliath", + "name": "goliath", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 
2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "sailor2", + "name": "sailor2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "firefunction-v2", + "name": "firefunction-v2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "alfred", + "name": "alfred", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "qwen3-coder", + "name": "qwen3-coder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r7b-arabic", + "name": "command-r7b-arabic", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + } + ] +} diff --git a/internal/providers/providers.go b/internal/providers/providers.go index 0d89ba16..3d669abf 100644 --- a/internal/providers/providers.go +++ b/internal/providers/providers.go @@ -36,6 +36,8 @@ var bedrockConfig []byte //go:embed configs/groq.json var groqConfig []byte +var ollamaConfig []byte + // ProviderFunc is a function that returns a Provider. 
type ProviderFunc func() catwalk.Provider @@ -49,6 +51,7 @@ var providerRegistry = []ProviderFunc{ xAIProvider, groqProvider, openRouterProvider, + ollamaProvider, } // GetAll returns all registered providers. @@ -104,3 +107,7 @@ func openRouterProvider() catwalk.Provider { func groqProvider() catwalk.Provider { return loadProviderFromConfig(groqConfig) } + +func ollamaProvider() catwalk.Provider { + return loadProviderFromConfig(ollamaConfig) +} From 56e26acbe41472cbef1f477d1879104db97ccd39 Mon Sep 17 00:00:00 2001 From: Zachary Loeber Date: Sun, 3 Aug 2025 13:14:16 -0500 Subject: [PATCH 2/4] fix: Remove any models without tools support --- internal/providers/configs/ollama.json | 1944 ++---------------------- internal/providers/new_models.json | 412 +++++ 2 files changed, 533 insertions(+), 1823 deletions(-) create mode 100644 internal/providers/new_models.json diff --git a/internal/providers/configs/ollama.json b/internal/providers/configs/ollama.json index b79fe6ef..60cd0ac5 100644 --- a/internal/providers/configs/ollama.json +++ b/internal/providers/configs/ollama.json @@ -12,92 +12,36 @@ "name": "deepseek-r1", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, - { - "id": "gemma3n", - "name": "gemma3n", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "gemma3", - "name": "gemma3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, { "id": "qwen3", "name": "qwen3", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - 
"cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, - { - "id": "qwen2.5vl", - "name": "qwen2.5vl", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": false, - "supports_attachments": true - }, { "id": "llama3.1", "name": "llama3.1", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": false, "supports_attachments": false }, - { - "id": "nomic-embed-text", - "name": "nomic-embed-text", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, { "id": "llama3.2", "name": "llama3.2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": false, @@ -108,8 +52,6 @@ "name": "mistral", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 32000, "default_max_tokens": 32000, "can_reason": true, @@ -120,2000 +62,356 @@ "name": "qwen2.5", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "llama3", - "name": "llama3", + "id": "qwen2.5-coder", + "name": "qwen2.5-coder", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, 
"supports_attachments": false }, { - "id": "llava", - "name": "llava", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "phi3", - "name": "phi3", + "id": "qwen2", + "name": "qwen2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "gemma2", - "name": "gemma2", + "id": "llama3.3", + "name": "llama3.3", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 8192, "default_max_tokens": 8192, - "can_reason": true, + "can_reason": false, "supports_attachments": false }, { - "id": "qwen2.5-coder", - "name": "qwen2.5-coder", + "id": "mistral-nemo", + "name": "mistral-nemo", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "gemma", - "name": "gemma", + "id": "qwq", + "name": "qwq", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 8192, "default_max_tokens": 8192, "can_reason": true, "supports_attachments": false }, { - "id": "qwen", - "name": "qwen", + "id": "mistral-small", + "name": "mistral-small", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, + "context_window": 32000, + "default_max_tokens": 32000, "can_reason": true, "supports_attachments": false }, { - "id": "mxbai-embed-large", - "name": "mxbai-embed-large", + "id": "smollm2", + 
"name": "smollm2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, + "context_window": 2048, + "default_max_tokens": 2048, "can_reason": true, "supports_attachments": false }, { - "id": "qwen2", - "name": "qwen2", + "id": "mixtral", + "name": "mixtral", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, + "context_window": 32000, + "default_max_tokens": 32000, "can_reason": true, "supports_attachments": false }, { - "id": "llama2", - "name": "llama2", + "id": "llama4", + "name": "llama4", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, + "context_window": 10000000, + "default_max_tokens": 10000000, "can_reason": true, "supports_attachments": false }, { - "id": "phi4", - "name": "phi4", + "id": "command-r", + "name": "command-r", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "minicpm-v", - "name": "minicpm-v", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 1800, - "default_max_tokens": 1800, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "codellama", - "name": "codellama", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": "100000", - "default_max_tokens": "100000", - "can_reason": false, - "supports_attachments": false - }, - { - "id": "tinyllama", - "name": "tinyllama", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - 
"context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama3.3", - "name": "llama3.3", + "id": "hermes3", + "name": "hermes3", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 8192, "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "llama3.2-vision", - "name": "llama3.2-vision", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, "can_reason": true, - "supports_attachments": true + "supports_attachments": false }, { - "id": "dolphin3", - "name": "dolphin3", + "id": "granite3.3", + "name": "granite3.3", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 8192, "default_max_tokens": 8192, "can_reason": true, "supports_attachments": false }, { - "id": "mistral-nemo", - "name": "mistral-nemo", + "id": "phi4-mini", + "name": "phi4-mini", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "olmo2", - "name": "olmo2", + "id": "magistral", + "name": "magistral", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, + "context_window": 40000, + "default_max_tokens": 40000, "can_reason": true, "supports_attachments": false }, { - "id": "deepseek-v3", - "name": "deepseek-v3", + "id": "devstral", + "name": "devstral", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - 
"id": "bge-m3", - "name": "bge-m3", + "id": "cogito", + "name": "cogito", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": false, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, "supports_attachments": false }, { - "id": "qwq", - "name": "qwq", + "id": "mistral-small3.1", + "name": "mistral-small3.1", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, - "supports_attachments": false + "supports_attachments": true }, { - "id": "mistral-small", - "name": "mistral-small", + "id": "granite3.2-vision", + "name": "granite3.2-vision", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 32000, "default_max_tokens": 32000, "can_reason": true, - "supports_attachments": false - }, - { - "id": "llava-llama3", - "name": "llava-llama3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, "supports_attachments": true }, { - "id": "smollm2", - "name": "smollm2", + "id": "mistral-large", + "name": "mistral-large", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "llama2-uncensored", - "name": "llama2-uncensored", + "id": "command-r-plus", + "name": "command-r-plus", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - 
"default_max_tokens": 4096, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "mixtral", - "name": "mixtral", + "id": "granite3.2", + "name": "granite3.2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "starcoder2", - "name": "starcoder2", + "id": "granite3.1-dense", + "name": "granite3.1-dense", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 16384, - "default_max_tokens": 16384, + "context_window": 2048, + "default_max_tokens": 2048, "can_reason": true, "supports_attachments": false }, { - "id": "all-minilm", - "name": "all-minilm", + "id": "granite3-dense", + "name": "granite3-dense", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, - "can_reason": false, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, "supports_attachments": false }, { - "id": "deepseek-coder-v2", - "name": "deepseek-coder-v2", + "id": "nemotron-mini", + "name": "nemotron-mini", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, + "context_window": 4096, + "default_max_tokens": 4096, "can_reason": true, "supports_attachments": false }, { - "id": "deepseek-coder", - "name": "deepseek-coder", + "id": "athene-v2", + "name": "athene-v2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 16000, - "default_max_tokens": 16000, - "can_reason": true, + "context_window": 2048, + "default_max_tokens": 
2048, + "can_reason": false, "supports_attachments": false }, { - "id": "snowflake-arctic-embed", - "name": "snowflake-arctic-embed", + "id": "nemotron", + "name": "nemotron", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, + "context_window": 4096, + "default_max_tokens": 4096, "can_reason": true, "supports_attachments": false }, { - "id": "codegemma", - "name": "codegemma", + "id": "llama3-groq-tool-use", + "name": "llama3-groq-tool-use", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 8192, "default_max_tokens": 8192, "can_reason": true, "supports_attachments": false }, { - "id": "phi", - "name": "phi", + "id": "mistral-small3.2", + "name": "mistral-small3.2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, + "context_window": 24000, + "default_max_tokens": 24000, "can_reason": true, "supports_attachments": false }, { - "id": "dolphin-mixtral", - "name": "dolphin-mixtral", + "id": "aya-expanse", + "name": "aya-expanse", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, "supports_attachments": false }, { - "id": "openthinker", - "name": "openthinker", + "id": "granite3-moe", + "name": "granite3-moe", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 32768, + "context_window": 2048, + "default_max_tokens": 2048, "can_reason": true, "supports_attachments": false }, { - "id": "llama4", - "name": "llama4", + "id": "granite3.1-moe", + "name": "granite3.1-moe", 
"cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 10000000, - "default_max_tokens": 10000000, + "context_window": 2048, + "default_max_tokens": 2048, "can_reason": true, "supports_attachments": false }, { - "id": "orca-mini", - "name": "orca-mini", + "id": "command-r7b", + "name": "command-r7b", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, + "context_window": 128000, + "default_max_tokens": 128000, "can_reason": true, "supports_attachments": false }, { - "id": "wizardlm2", - "name": "wizardlm2", + "id": "command-a", + "name": "command-a", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, + "context_window": 256000, + "default_max_tokens": 256000, "can_reason": true, "supports_attachments": false }, { - "id": "smollm", - "name": "smollm", + "id": "firefunction-v2", + "name": "firefunction-v2", "cost_per_1m_in": 0, "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 2048, "default_max_tokens": 2048, "can_reason": true, "supports_attachments": false }, - { - "id": "dolphin-mistral", - "name": "dolphin-mistral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "codestral", - "name": "codestral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "dolphin-llama3", - "name": "dolphin-llama3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - 
"cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r", - "name": "command-r", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "hermes3", - "name": "hermes3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "phi3.5", - "name": "phi3.5", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "yi", - "name": "yi", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "zephyr", - "name": "zephyr", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.3", - "name": "granite3.3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "phi4-mini", - "name": "phi4-mini", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - 
"can_reason": true, - "supports_attachments": false - }, - { - "id": "moondream", - "name": "moondream", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "granite-code", - "name": "granite-code", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "wizard-vicuna-uncensored", - "name": "wizard-vicuna-uncensored", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "magistral", - "name": "magistral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 40000, - "default_max_tokens": 40000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "devstral", - "name": "devstral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "phi4-reasoning", - "name": "phi4-reasoning", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "starcoder", - "name": "starcoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": 
false - }, - { - "id": "cogito", - "name": "cogito", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mistral-small3.1", - "name": "mistral-small3.1", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "deepcoder", - "name": "deepcoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "vicuna", - "name": "vicuna", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "openchat", - "name": "openchat", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mistral-openorca", - "name": "mistral-openorca", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "codegeex4", - "name": "codegeex4", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "deepseek-llm", - "name": "deepseek-llm", - 
"cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "deepseek-v2", - "name": "deepseek-v2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "openhermes", - "name": "openhermes", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.2-vision", - "name": "granite3.2-vision", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "codeqwen", - "name": "codeqwen", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": "64000", - "default_max_tokens": "64000", - "can_reason": false, - "supports_attachments": false - }, - { - "id": "mistral-large", - "name": "mistral-large", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama2-chinese", - "name": "llama2-chinese", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "aya", - "name": "aya", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - 
"cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "tinydolphin", - "name": "tinydolphin", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "glm4", - "name": "glm4", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "qwen2-math", - "name": "qwen2-math", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "stable-code", - "name": "stable-code", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 16384, - "default_max_tokens": 16384, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "nous-hermes2", - "name": "nous-hermes2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "wizardcoder", - "name": "wizardcoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r-plus", - "name": "command-r-plus", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - 
"context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "bakllava", - "name": "bakllava", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "neural-chat", - "name": "neural-chat", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.2", - "name": "granite3.2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "stablelm2", - "name": "stablelm2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "bge-large", - "name": "bge-large", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "sqlcoder", - "name": "sqlcoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama3-chatqa", - "name": "llama3-chatqa", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - 
"supports_attachments": false - }, - { - "id": "snowflake-arctic-embed2", - "name": "snowflake-arctic-embed2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "reflection", - "name": "reflection", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "wizard-math", - "name": "wizard-math", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llava-phi3", - "name": "llava-phi3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "nous-hermes", - "name": "nous-hermes", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.1-dense", - "name": "granite3.1-dense", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3-dense", - "name": "granite3-dense", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - 
"id": "llama3-gradient", - "name": "llama3-gradient", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "dbrx", - "name": "dbrx", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": "32768", - "default_max_tokens": "32768", - "can_reason": true, - "supports_attachments": false - }, - { - "id": "exaone3.5", - "name": "exaone3.5", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "samantha-mistral", - "name": "samantha-mistral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "yi-coder", - "name": "yi-coder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "falcon", - "name": "falcon", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "dolphincoder", - "name": "dolphincoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "nemotron-mini", - "name": "nemotron-mini", - "cost_per_1m_in": 0, - 
"cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "starling-lm", - "name": "starling-lm", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "deepscaler", - "name": "deepscaler", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "phind-codellama", - "name": "phind-codellama", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 16000, - "default_max_tokens": 16000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "solar", - "name": "solar", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "xwinlm", - "name": "xwinlm", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "internlm2", - "name": "internlm2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "athene-v2", - "name": "athene-v2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - 
"context_window": 2048, - "default_max_tokens": 2048, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "opencoder", - "name": "opencoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "dolphin-phi", - "name": "dolphin-phi", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "nemotron", - "name": "nemotron", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "yarn-llama2", - "name": "yarn-llama2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "exaone-deep", - "name": "exaone-deep", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama3-groq-tool-use", - "name": "llama3-groq-tool-use", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "wizardlm", - "name": "wizardlm", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - 
"can_reason": true, - "supports_attachments": false - }, - { - "id": "mistral-small3.2", - "name": "mistral-small3.2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 24000, - "default_max_tokens": 24000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "paraphrase-multilingual", - "name": "paraphrase-multilingual", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "falcon3", - "name": "falcon3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "wizardlm-uncensored", - "name": "wizardlm-uncensored", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "aya-expanse", - "name": "aya-expanse", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "orca2", - "name": "orca2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "smallthinker", - "name": "smallthinker", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - 
"supports_attachments": false - }, - { - "id": "llama-guard3", - "name": "llama-guard3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite-embedding", - "name": "granite-embedding", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 512, - "default_max_tokens": 512, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "medllama2", - "name": "medllama2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "nous-hermes2-mixtral", - "name": "nous-hermes2-mixtral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "stable-beluga", - "name": "stable-beluga", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "meditron", - "name": "meditron", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3-moe", - "name": "granite3-moe", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": 
"r1-1776", - "name": "r1-1776", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.1-moe", - "name": "granite3.1-moe", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "deepseek-v2.5", - "name": "deepseek-v2.5", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "reader-lm", - "name": "reader-lm", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama-pro", - "name": "llama-pro", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "yarn-mistral", - "name": "yarn-mistral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "shieldgemma", - "name": "shieldgemma", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "nexusraven", - "name": "nexusraven", - "cost_per_1m_in": 0, - 
"cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r7b", - "name": "command-r7b", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mathstral", - "name": "mathstral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "everythinglm", - "name": "everythinglm", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 16384, - "default_max_tokens": 16384, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "codeup", - "name": "codeup", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "marco-o1", - "name": "marco-o1", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "stablelm-zephyr", - "name": "stablelm-zephyr", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "tulu3", - "name": "tulu3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - 
"context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "solar-pro", - "name": "solar-pro", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "duckdb-nsql", - "name": "duckdb-nsql", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "phi4-mini-reasoning", - "name": "phi4-mini-reasoning", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "falcon2", - "name": "falcon2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "magicoder", - "name": "magicoder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mistrallite", - "name": "mistrallite", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "codebooga", - "name": "codebooga", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": 
true, - "supports_attachments": false - }, - { - "id": "bespoke-minicheck", - "name": "bespoke-minicheck", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "wizard-vicuna", - "name": "wizard-vicuna", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "nuextract", - "name": "nuextract", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3-guardian", - "name": "granite3-guardian", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "megadolphin", - "name": "megadolphin", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "notux", - "name": "notux", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "open-orca-platypus2", - "name": "open-orca-platypus2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { 
- "id": "notus", - "name": "notus", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-a", - "name": "command-a", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 256000, - "default_max_tokens": 256000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "goliath", - "name": "goliath", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "sailor2", - "name": "sailor2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "firefunction-v2", - "name": "firefunction-v2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "alfred", - "name": "alfred", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "qwen3-coder", - "name": "qwen3-coder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, { "id": "command-r7b-arabic", "name": "command-r7b-arabic", "cost_per_1m_in": 0, "cost_per_1m_out": 
0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 128000, "can_reason": true, diff --git a/internal/providers/new_models.json b/internal/providers/new_models.json new file mode 100644 index 00000000..7cdd7871 --- /dev/null +++ b/internal/providers/new_models.json @@ -0,0 +1,412 @@ +[ + { + "id": "deepseek-r1", + "name": "deepseek-r1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen3", + "name": "qwen3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3.1", + "name": "llama3.1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "llama3.2", + "name": "llama3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "mistral", + "name": "mistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2.5", + "name": "qwen2.5", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2.5-coder", + "name": "qwen2.5-coder", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwen2", + "name": "qwen2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": 
true, + "supports_attachments": false + }, + { + "id": "llama3.3", + "name": "llama3.3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "mistral-nemo", + "name": "mistral-nemo", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "qwq", + "name": "qwq", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-small", + "name": "mistral-small", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "smollm2", + "name": "smollm2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mixtral", + "name": "mixtral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama4", + "name": "llama4", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 10000000, + "default_max_tokens": 10000000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r", + "name": "command-r", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "hermes3", + "name": "hermes3", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.3", + "name": "granite3.3", + 
"cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "phi4-mini", + "name": "phi4-mini", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "magistral", + "name": "magistral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 40000, + "default_max_tokens": 40000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "devstral", + "name": "devstral", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "cogito", + "name": "cogito", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-small3.1", + "name": "mistral-small3.1", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "granite3.2-vision", + "name": "granite3.2-vision", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 32000, + "default_max_tokens": 32000, + "can_reason": true, + "supports_attachments": true + }, + { + "id": "mistral-large", + "name": "mistral-large", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r-plus", + "name": "command-r-plus", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.2", + "name": "granite3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 
0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.1-dense", + "name": "granite3.1-dense", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3-dense", + "name": "granite3-dense", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "nemotron-mini", + "name": "nemotron-mini", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "athene-v2", + "name": "athene-v2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "nemotron", + "name": "nemotron", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 4096, + "default_max_tokens": 4096, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "llama3-groq-tool-use", + "name": "llama3-groq-tool-use", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 8192, + "default_max_tokens": 8192, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "mistral-small3.2", + "name": "mistral-small3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 24000, + "default_max_tokens": 24000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "aya-expanse", + "name": "aya-expanse", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "granite3-moe", + "name": "granite3-moe", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + 
"context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "granite3.1-moe", + "name": "granite3.1-moe", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r7b", + "name": "command-r7b", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-a", + "name": "command-a", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 256000, + "default_max_tokens": 256000, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "firefunction-v2", + "name": "firefunction-v2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 2048, + "default_max_tokens": 2048, + "can_reason": true, + "supports_attachments": false + }, + { + "id": "command-r7b-arabic", + "name": "command-r7b-arabic", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "context_window": 128000, + "default_max_tokens": 128000, + "can_reason": true, + "supports_attachments": false + } +] \ No newline at end of file From b533f95ca2ba0443647a64530166a108564613b4 Mon Sep 17 00:00:00 2001 From: Zachary Loeber Date: Sun, 3 Aug 2025 13:15:06 -0500 Subject: [PATCH 3/4] fix: Remove any models without tools support --- internal/providers/new_models.json | 412 ----------------------------- 1 file changed, 412 deletions(-) delete mode 100644 internal/providers/new_models.json diff --git a/internal/providers/new_models.json b/internal/providers/new_models.json deleted file mode 100644 index 7cdd7871..00000000 --- a/internal/providers/new_models.json +++ /dev/null @@ -1,412 +0,0 @@ -[ - { - "id": "deepseek-r1", - "name": "deepseek-r1", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - 
"supports_attachments": false - }, - { - "id": "qwen3", - "name": "qwen3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama3.1", - "name": "llama3.1", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "llama3.2", - "name": "llama3.2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "mistral", - "name": "mistral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "qwen2.5", - "name": "qwen2.5", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "qwen2.5-coder", - "name": "qwen2.5-coder", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "qwen2", - "name": "qwen2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama3.3", - "name": "llama3.3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "mistral-nemo", - "name": "mistral-nemo", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "qwq", - "name": "qwq", - "cost_per_1m_in": 
0, - "cost_per_1m_out": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mistral-small", - "name": "mistral-small", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "smollm2", - "name": "smollm2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mixtral", - "name": "mixtral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama4", - "name": "llama4", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 10000000, - "default_max_tokens": 10000000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r", - "name": "command-r", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "hermes3", - "name": "hermes3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.3", - "name": "granite3.3", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "phi4-mini", - "name": "phi4-mini", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "magistral", - "name": "magistral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 40000, - "default_max_tokens": 40000, - 
"can_reason": true, - "supports_attachments": false - }, - { - "id": "devstral", - "name": "devstral", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "cogito", - "name": "cogito", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mistral-small3.1", - "name": "mistral-small3.1", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "granite3.2-vision", - "name": "granite3.2-vision", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 32000, - "default_max_tokens": 32000, - "can_reason": true, - "supports_attachments": true - }, - { - "id": "mistral-large", - "name": "mistral-large", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r-plus", - "name": "command-r-plus", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.2", - "name": "granite3.2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.1-dense", - "name": "granite3.1-dense", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3-dense", - "name": "granite3-dense", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, 
- "supports_attachments": false - }, - { - "id": "nemotron-mini", - "name": "nemotron-mini", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "athene-v2", - "name": "athene-v2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "nemotron", - "name": "nemotron", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 4096, - "default_max_tokens": 4096, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "llama3-groq-tool-use", - "name": "llama3-groq-tool-use", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 8192, - "default_max_tokens": 8192, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "mistral-small3.2", - "name": "mistral-small3.2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 24000, - "default_max_tokens": 24000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "aya-expanse", - "name": "aya-expanse", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": false, - "supports_attachments": false - }, - { - "id": "granite3-moe", - "name": "granite3-moe", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "granite3.1-moe", - "name": "granite3.1-moe", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r7b", - "name": "command-r7b", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false 
- }, - { - "id": "command-a", - "name": "command-a", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 256000, - "default_max_tokens": 256000, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "firefunction-v2", - "name": "firefunction-v2", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 2048, - "default_max_tokens": 2048, - "can_reason": true, - "supports_attachments": false - }, - { - "id": "command-r7b-arabic", - "name": "command-r7b-arabic", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "context_window": 128000, - "default_max_tokens": 128000, - "can_reason": true, - "supports_attachments": false - } -] \ No newline at end of file From 7b0f7f1a66d71da00c8914f273afe58439fabd54 Mon Sep 17 00:00:00 2001 From: Zachary Loeber Date: Sun, 3 Aug 2025 13:19:11 -0500 Subject: [PATCH 4/4] fix: merge origin/main updates --- internal/providers/providers.go | 15 ++++----------- 1 file changed, 4 insertions(+), 11 deletions(-) diff --git a/internal/providers/providers.go b/internal/providers/providers.go index 31debac1..846a6da0 100644 --- a/internal/providers/providers.go +++ b/internal/providers/providers.go @@ -36,15 +36,12 @@ var bedrockConfig []byte //go:embed configs/groq.json var groqConfig []byte -<<<<<<< HEAD -var ollamaConfig []byte - -||||||| ea52d41 -======= //go:embed configs/lambda.json var lambdaConfig []byte ->>>>>>> main +//go:embed configs/ollama.json +var ollamaConfig []byte + // ProviderFunc is a function that returns a Provider. type ProviderFunc func() catwalk.Provider @@ -58,12 +55,8 @@ var providerRegistry = []ProviderFunc{ xAIProvider, groqProvider, openRouterProvider, -<<<<<<< HEAD - ollamaProvider, -||||||| ea52d41 -======= lambdaProvider, ->>>>>>> main + ollamaProvider, } // GetAll returns all registered providers.