Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
26 changes: 26 additions & 0 deletions providers/google-vertex/models/deepseek-ai/deepseek-v3.1-maas.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
# Model metadata for DeepSeek V3.1.
name = "DeepSeek V3.1"
family = "deepseek"
release_date = "2025-08-28"
last_updated = "2025-08-28"
# Keep in sync with [modalities].input: a non-text input type ("pdf") is
# listed there, so attachments are flagged as supported.
# NOTE(review): if PDF input is not actually accepted by this endpoint, drop
# "pdf" from [modalities].input and set this back to false instead.
attachment = true
reasoning = true
temperature = true
tool_call = true
structured_output = true
open_weights = true

# NOTE(review): units are not stated in this file; presumably USD per 1M
# tokens. Confirm against the catalogue schema.
[cost]
input = 0.60
output = 1.70

# NOTE(review): presumably token counts. Confirm against the catalogue schema.
[limit]
context = 163_840
output = 32_768

[modalities]
input = ["text", "pdf"]
output = ["text"]

# TOML performs no interpolation: the ${GOOGLE_VERTEX_*} placeholders are
# stored literally and must be expanded by whatever consumes this file.
[provider]
npm = "@ai-sdk/openai-compatible"
api = "https://${GOOGLE_VERTEX_ENDPOINT}/v1/projects/${GOOGLE_VERTEX_PROJECT}/locations/${GOOGLE_VERTEX_LOCATION}/endpoints/openapi"
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Model metadata for Llama 3.3 70B Instruct.
name = "Llama 3.3 70B Instruct"
family = "llama"

# Dates are kept as strings; `knowledge` carries year-month only.
release_date = "2025-04-29"
last_updated = "2025-04-29"
knowledge = "2023-12"

# Capability flags.
attachment = false
reasoning = false
temperature = true
tool_call = true
structured_output = true
open_weights = true

# NOTE(review): units are not stated in this file; presumably USD per 1M
# tokens. Confirm against the catalogue schema.
[cost]
input = 0.72
output = 0.72

# NOTE(review): presumably token counts. Confirm against the catalogue schema.
[limit]
context = 128_000
output = 8_192

[modalities]
input = ["text"]
output = ["text"]

# TOML performs no interpolation: the ${GOOGLE_VERTEX_*} placeholders are
# stored literally and must be expanded by whatever consumes this file.
[provider]
npm = "@ai-sdk/openai-compatible"
api = "https://${GOOGLE_VERTEX_ENDPOINT}/v1/projects/${GOOGLE_VERTEX_PROJECT}/locations/${GOOGLE_VERTEX_LOCATION}/endpoints/openapi"
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
# Model metadata for Llama 4 Maverick 17B 128E Instruct.
name = "Llama 4 Maverick 17B 128E Instruct"
family = "llama"

# Dates are kept as strings; `knowledge` carries year-month only.
knowledge = "2024-08"
release_date = "2025-04-29"
last_updated = "2025-04-29"

# Capability flags. `attachment` is true here and [modalities].input lists a
# non-text type ("image"); keep the two in agreement when editing.
attachment = true
reasoning = false
temperature = true
tool_call = true
structured_output = true
open_weights = true

# NOTE(review): units are not stated in this file; presumably USD per 1M
# tokens. Confirm against the catalogue schema.
[cost]
input = 0.35
output = 1.15

# NOTE(review): presumably token counts. Confirm against the catalogue schema.
[limit]
context = 524_288
output = 8_192

[modalities]
input = ["text", "image"]
output = ["text"]

# TOML performs no interpolation: the ${GOOGLE_VERTEX_*} placeholders are
# stored literally and must be expanded by whatever consumes this file.
[provider]
npm = "@ai-sdk/openai-compatible"
api = "https://${GOOGLE_VERTEX_ENDPOINT}/v1/projects/${GOOGLE_VERTEX_PROJECT}/locations/${GOOGLE_VERTEX_LOCATION}/endpoints/openapi"
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
# Model metadata for Qwen3 235B A22B Instruct.
name = "Qwen3 235B A22B Instruct"
family = "qwen"

# Dates are kept as strings.
release_date = "2025-08-13"
last_updated = "2025-08-13"

# Capability flags.
# NOTE(review): `reasoning = true` on an "Instruct" variant looks unusual;
# confirm this deployment actually produces reasoning output.
attachment = false
reasoning = true
temperature = true
tool_call = true
structured_output = true
open_weights = true

# NOTE(review): units are not stated in this file; presumably USD per 1M
# tokens. Confirm against the catalogue schema.
[cost]
input = 0.22
output = 0.88

# NOTE(review): presumably token counts. Confirm against the catalogue schema.
[limit]
context = 262_144
output = 16_384

[modalities]
input = ["text"]
output = ["text"]

# TOML performs no interpolation: the ${GOOGLE_VERTEX_*} placeholders are
# stored literally and must be expanded by whatever consumes this file.
[provider]
npm = "@ai-sdk/openai-compatible"
api = "https://${GOOGLE_VERTEX_ENDPOINT}/v1/projects/${GOOGLE_VERTEX_PROJECT}/locations/${GOOGLE_VERTEX_LOCATION}/endpoints/openapi"
19 changes: 12 additions & 7 deletions providers/google-vertex/models/zai-org/glm-4.7-maas.toml
Original file line number Diff line number Diff line change
@@ -1,25 +1,30 @@
# Model metadata for GLM-4.7.
# Each key is defined exactly once: TOML rejects a document that assigns the
# same key twice, so only the current (post-change) values are kept.
name = "GLM-4.7"
family = "glm"
release_date = "2026-01-06"
last_updated = "2026-01-06"
# Keep in sync with [modalities].input: a non-text input type ("pdf") is
# listed there, so attachments are flagged as supported.
# NOTE(review): if PDF input is not actually accepted by this endpoint, drop
# "pdf" from [modalities].input and set this back to false instead.
attachment = true
reasoning = true
temperature = true
tool_call = true
structured_output = true
knowledge = "2025-04"
open_weights = true

[interleaved]
field = "reasoning_content"

# NOTE(review): units are not stated in this file; presumably USD per 1M
# tokens. Confirm against the catalogue schema.
[cost]
input = 0.60
output = 2.20

# NOTE(review): presumably token counts. Confirm against the catalogue schema.
[limit]
context = 200_000
output = 128_000

[modalities]
input = ["text", "pdf"]
output = ["text"]

# TOML performs no interpolation: the ${GOOGLE_VERTEX_*} placeholders are
# stored literally and must be expanded by whatever consumes this file.
[provider]
npm = "@ai-sdk/openai-compatible"
api = "https://${GOOGLE_VERTEX_ENDPOINT}/v1/projects/${GOOGLE_VERTEX_PROJECT}/locations/${GOOGLE_VERTEX_LOCATION}/endpoints/openapi"