diff --git a/providers/google-vertex-openai/models/deepseek-v3.1-maas.toml b/providers/google-vertex-openai/models/deepseek-v3.1-maas.toml new file mode 100644 index 000000000..22b1b3b28 --- /dev/null +++ b/providers/google-vertex-openai/models/deepseek-v3.1-maas.toml @@ -0,0 +1,22 @@ +name = "DeepSeek V3.1" +family = "deepseek" +release_date = "2025-06-01" +last_updated = "2025-06-01" +attachment = false +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-05" +open_weights = true + +[cost] +input = 0.27 +output = 1.10 + +[limit] +context = 131072 +output = 32768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/google-vertex/models/zai-org/glm-4.7-maas.toml b/providers/google-vertex-openai/models/glm-4.7-maas.toml similarity index 100% rename from providers/google-vertex/models/zai-org/glm-4.7-maas.toml rename to providers/google-vertex-openai/models/glm-4.7-maas.toml diff --git a/providers/google-vertex-openai/models/llama-3.3-70b-instruct-maas.toml b/providers/google-vertex-openai/models/llama-3.3-70b-instruct-maas.toml new file mode 100644 index 000000000..984220fb1 --- /dev/null +++ b/providers/google-vertex-openai/models/llama-3.3-70b-instruct-maas.toml @@ -0,0 +1,22 @@ +name = "Llama 3.3 70B Instruct" +family = "llama" +release_date = "2024-12-06" +last_updated = "2024-12-06" +attachment = false +reasoning = true +temperature = true +tool_call = true +knowledge = "2024-12" +open_weights = true + +[cost] +input = 0.20 +output = 0.20 + +[limit] +context = 131072 +output = 32768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/google-vertex-openai/models/llama-4-maverick-17b-128e-instruct-maas.toml b/providers/google-vertex-openai/models/llama-4-maverick-17b-128e-instruct-maas.toml new file mode 100644 index 000000000..8d3242a26 --- /dev/null +++ b/providers/google-vertex-openai/models/llama-4-maverick-17b-128e-instruct-maas.toml @@ -0,0 +1,22 @@ +name = "Llama 4 Maverick 17B-128E" +family = "llama" +release_date = "2025-04-05" +last_updated = "2025-04-05" +attachment = true +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-03" +open_weights = true + +[cost] +input = 0.18 +output = 0.59 + +[limit] +context = 1048576 +output = 131072 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/google-vertex-openai/models/qwen3-235b-a22b-instruct-2507-maas.toml b/providers/google-vertex-openai/models/qwen3-235b-a22b-instruct-2507-maas.toml new file mode 100644 index 000000000..ad27a64c1 --- /dev/null +++ b/providers/google-vertex-openai/models/qwen3-235b-a22b-instruct-2507-maas.toml @@ -0,0 +1,22 @@ +name = "Qwen3 235B Instruct" +family = "qwen" +release_date = "2025-07-25" +last_updated = "2025-07-25" +attachment = false +reasoning = true +temperature = true +tool_call = true +knowledge = "2025-06" +open_weights = true + +[cost] +input = 0.30 +output = 1.20 + +[limit] +context = 131072 +output = 32768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/google-vertex-openai/provider.toml b/providers/google-vertex-openai/provider.toml new file mode 100644 index 000000000..fef5aab69 --- /dev/null +++ b/providers/google-vertex-openai/provider.toml @@ -0,0 +1,4 @@ +name = "Vertex (OpenAI-Compatible)" +env = ["GOOGLE_CLOUD_PROJECT", "GOOGLE_VERTEX_PROJECT", "GCP_PROJECT", "GCLOUD_PROJECT", "GOOGLE_CLOUD_LOCATION", "VERTEX_LOCATION", "GOOGLE_APPLICATION_CREDENTIALS"] +npm = "@ai-sdk/openai-compatible" +doc = "https://cloud.google.com/vertex-ai/generative-ai/docs/maas/call-open-model-apis" diff --git a/providers/google-vertex/models/openai/gpt-oss-120b-maas.toml b/providers/google-vertex/models/openai/gpt-oss-120b-maas.toml deleted file mode 100644 index aeab25caf..000000000 --- a/providers/google-vertex/models/openai/gpt-oss-120b-maas.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT OSS 120B" -family = "gpt-oss" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[cost] -input = 0.09 -output = 0.36 - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"] diff --git a/providers/google-vertex/models/openai/gpt-oss-20b-maas.toml b/providers/google-vertex/models/openai/gpt-oss-20b-maas.toml deleted file mode 100644 index 6c943fd99..000000000 --- a/providers/google-vertex/models/openai/gpt-oss-20b-maas.toml +++ /dev/null @@ -1,21 +0,0 @@ -name = "GPT OSS 20B" -family = "gpt-oss" -release_date = "2025-08-05" -last_updated = "2025-08-05" -attachment = false -reasoning = true -temperature = true -tool_call = true -open_weights = true - -[cost] -input = 0.07 -output = 0.25 - -[limit] -context = 131_072 -output = 32_768 - -[modalities] -input = ["text"] -output = ["text"]