From 34fd6673e5684ccc377fa821ff48af498d5703eb Mon Sep 17 00:00:00 2001 From: smakosh Date: Thu, 7 May 2026 22:20:52 +0200 Subject: [PATCH 1/3] chore(llmgateway): add new text models from llmgateway catalog Add gemini-3.1-flash-lite, grok-4-3, gpt-5.5, gpt-5.5-pro, qwen3.6 and MiMo v2 models that exist in llmgateway.io but were missing from models.dev. Adds parent definitions for grok-4-3, gemini-3.1-flash-lite, and qwen3.6-max-preview where they did not already exist. Co-Authored-By: Claude Opus 4.7 (1M context) --- .../alibaba/models/qwen3.6-max-preview.toml | 22 ++++++++++++++++ .../models/gemini-3.1-flash-lite.toml | 2 ++ .../google/models/gemini-3.1-flash-lite.toml | 25 +++++++++++++++++++ .../models/gemini-3.1-flash-lite.toml | 2 ++ providers/llmgateway/models/gpt-5.5-pro.toml | 2 ++ providers/llmgateway/models/gpt-5.5.toml | 2 ++ providers/llmgateway/models/grok-4-3.toml | 2 ++ providers/llmgateway/models/mimo-v2-omni.toml | 2 ++ providers/llmgateway/models/mimo-v2-pro.toml | 2 ++ .../llmgateway/models/mimo-v2.5-pro.toml | 2 ++ providers/llmgateway/models/mimo-v2.5.toml | 2 ++ .../llmgateway/models/qwen3.6-35b-a3b.toml | 2 ++ .../models/qwen3.6-max-preview.toml | 2 ++ providers/llmgateway/models/qwen3.6-plus.toml | 2 ++ providers/xai/models/grok-4-3.toml | 22 ++++++++++++++++ 15 files changed, 93 insertions(+) create mode 100644 providers/alibaba/models/qwen3.6-max-preview.toml create mode 100644 providers/google-vertex/models/gemini-3.1-flash-lite.toml create mode 100644 providers/google/models/gemini-3.1-flash-lite.toml create mode 100644 providers/llmgateway/models/gemini-3.1-flash-lite.toml create mode 100644 providers/llmgateway/models/gpt-5.5-pro.toml create mode 100644 providers/llmgateway/models/gpt-5.5.toml create mode 100644 providers/llmgateway/models/grok-4-3.toml create mode 100644 providers/llmgateway/models/mimo-v2-omni.toml create mode 100644 providers/llmgateway/models/mimo-v2-pro.toml create mode 100644 providers/llmgateway/models/mimo-v2.5-pro.toml create mode 100644 providers/llmgateway/models/mimo-v2.5.toml create mode 100644 providers/llmgateway/models/qwen3.6-35b-a3b.toml create mode 100644 providers/llmgateway/models/qwen3.6-max-preview.toml create mode 100644 providers/llmgateway/models/qwen3.6-plus.toml create mode 100644 providers/xai/models/grok-4-3.toml diff --git a/providers/alibaba/models/qwen3.6-max-preview.toml b/providers/alibaba/models/qwen3.6-max-preview.toml new file mode 100644 index 000000000..e64bc15e6 --- /dev/null +++ b/providers/alibaba/models/qwen3.6-max-preview.toml @@ -0,0 +1,22 @@ +name = "Qwen3.6 Max Preview" +family = "qwen" +release_date = "2026-05-07" +last_updated = "2026-05-07" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = false + +[cost] +input = 1.30 +output = 7.80 +cache_read = 0.13 + +[limit] +context = 262_144 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/google-vertex/models/gemini-3.1-flash-lite.toml b/providers/google-vertex/models/gemini-3.1-flash-lite.toml new file mode 100644 index 000000000..867a78b8e --- /dev/null +++ b/providers/google-vertex/models/gemini-3.1-flash-lite.toml @@ -0,0 +1,2 @@ +[extends] +from = "google/gemini-3.1-flash-lite" diff --git a/providers/google/models/gemini-3.1-flash-lite.toml b/providers/google/models/gemini-3.1-flash-lite.toml new file mode 100644 index 000000000..f8ef01f36 --- /dev/null +++ b/providers/google/models/gemini-3.1-flash-lite.toml @@ -0,0 +1,25 @@ +name = "Gemini 3.1 Flash Lite" +family = "gemini-flash-lite" +release_date = "2026-05-07" +last_updated = "2026-05-07" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +knowledge = "2025-01" +open_weights = false + +[cost] +input = 0.25 +output = 1.50 +cache_read = 0.025 +cache_write = 0.0833 + +[limit] +context = 1_048_576 +output = 65_536 + +[modalities] +input = ["text", "image", "video", "audio", "pdf"] +output = ["text"] diff --git a/providers/llmgateway/models/gemini-3.1-flash-lite.toml b/providers/llmgateway/models/gemini-3.1-flash-lite.toml new file mode 100644 index 000000000..867a78b8e --- /dev/null +++ b/providers/llmgateway/models/gemini-3.1-flash-lite.toml @@ -0,0 +1,2 @@ +[extends] +from = "google/gemini-3.1-flash-lite" diff --git a/providers/llmgateway/models/gpt-5.5-pro.toml b/providers/llmgateway/models/gpt-5.5-pro.toml new file mode 100644 index 000000000..97bc59ce0 --- /dev/null +++ b/providers/llmgateway/models/gpt-5.5-pro.toml @@ -0,0 +1,2 @@ +[extends] +from = "openai/gpt-5.5-pro" diff --git a/providers/llmgateway/models/gpt-5.5.toml b/providers/llmgateway/models/gpt-5.5.toml new file mode 100644 index 000000000..8ab9ada46 --- /dev/null +++ b/providers/llmgateway/models/gpt-5.5.toml @@ -0,0 +1,2 @@ +[extends] +from = "openai/gpt-5.5" diff --git a/providers/llmgateway/models/grok-4-3.toml b/providers/llmgateway/models/grok-4-3.toml new file mode 100644 index 000000000..b1353edd9 --- /dev/null +++ b/providers/llmgateway/models/grok-4-3.toml @@ -0,0 +1,2 @@ +[extends] +from = "xai/grok-4-3" diff --git a/providers/llmgateway/models/mimo-v2-omni.toml b/providers/llmgateway/models/mimo-v2-omni.toml new file mode 100644 index 000000000..71be0c3ad --- /dev/null +++ b/providers/llmgateway/models/mimo-v2-omni.toml @@ -0,0 +1,2 @@ +[extends] +from = "xiaomi/mimo-v2-omni" diff --git a/providers/llmgateway/models/mimo-v2-pro.toml b/providers/llmgateway/models/mimo-v2-pro.toml new file mode 100644 index 000000000..04dad856e --- /dev/null +++ b/providers/llmgateway/models/mimo-v2-pro.toml @@ -0,0 +1,2 @@ +[extends] +from = "xiaomi/mimo-v2-pro" diff --git a/providers/llmgateway/models/mimo-v2.5-pro.toml b/providers/llmgateway/models/mimo-v2.5-pro.toml new file mode 100644 index 000000000..c5ed14b6e --- /dev/null +++ b/providers/llmgateway/models/mimo-v2.5-pro.toml @@ -0,0 +1,2 @@ +[extends] +from = "xiaomi/mimo-v2.5-pro" diff --git a/providers/llmgateway/models/mimo-v2.5.toml b/providers/llmgateway/models/mimo-v2.5.toml new file mode 100644 index 000000000..412705bee --- /dev/null +++ b/providers/llmgateway/models/mimo-v2.5.toml @@ -0,0 +1,2 @@ +[extends] +from = "xiaomi/mimo-v2.5" diff --git a/providers/llmgateway/models/qwen3.6-35b-a3b.toml b/providers/llmgateway/models/qwen3.6-35b-a3b.toml new file mode 100644 index 000000000..53ab1ffad --- /dev/null +++ b/providers/llmgateway/models/qwen3.6-35b-a3b.toml @@ -0,0 +1,2 @@ +[extends] +from = "alibaba/qwen3.6-35b-a3b" diff --git a/providers/llmgateway/models/qwen3.6-max-preview.toml b/providers/llmgateway/models/qwen3.6-max-preview.toml new file mode 100644 index 000000000..207934cdf --- /dev/null +++ b/providers/llmgateway/models/qwen3.6-max-preview.toml @@ -0,0 +1,2 @@ +[extends] +from = "alibaba/qwen3.6-max-preview" diff --git a/providers/llmgateway/models/qwen3.6-plus.toml b/providers/llmgateway/models/qwen3.6-plus.toml new file mode 100644 index 000000000..feb038db2 --- /dev/null +++ b/providers/llmgateway/models/qwen3.6-plus.toml @@ -0,0 +1,2 @@ +[extends] +from = "alibaba/qwen3.6-plus" diff --git a/providers/xai/models/grok-4-3.toml b/providers/xai/models/grok-4-3.toml new file mode 100644 index 000000000..bf45530e3 --- /dev/null +++ b/providers/xai/models/grok-4-3.toml @@ -0,0 +1,22 @@ +name = "Grok 4.3" +family = "grok" +release_date = "2026-05-07" +last_updated = "2026-05-07" +attachment = true +reasoning = true +temperature = true +tool_call = true +open_weights = false + +[cost] +input = 1.25 +output = 2.50 +cache_read = 0.3125 + +[limit] +context = 1_000_000 +output = 30_000 + +[modalities] +input = ["text", "image"] +output = ["text"] From 70ac6fccdae12b018bb4d137d2224aa34132cdb7 Mon Sep 17 00:00:00 2001 From: smakosh Date: Thu, 7 May 2026 22:34:01 +0200 Subject: [PATCH 2/3] fix(models): use canonical entries for qwen3.6-max-preview and grok-4.3 Apply the canonical TOML provided by the LLM Gateway team for the Qwen3.6 Max Preview and Grok 4.3 parent definitions, replacing the upstream-merged variants whose dates and pricing did not match. Co-Authored-By: Claude Opus 4.7 (1M context) --- providers/alibaba/models/qwen3.6-max-preview.toml | 10 ++++------ providers/xai/models/grok-4.3.toml | 11 +++-------- 2 files changed, 7 insertions(+), 14 deletions(-) diff --git a/providers/alibaba/models/qwen3.6-max-preview.toml b/providers/alibaba/models/qwen3.6-max-preview.toml index 09a6c5458..e64bc15e6 100644 --- a/providers/alibaba/models/qwen3.6-max-preview.toml +++ b/providers/alibaba/models/qwen3.6-max-preview.toml @@ -1,19 +1,17 @@ name = "Qwen3.6 Max Preview" family = "qwen" -release_date = "2026-04-20" -last_updated = "2026-04-20" +release_date = "2026-05-07" +last_updated = "2026-05-07" attachment = false reasoning = true temperature = true -knowledge = "2025-04" tool_call = true open_weights = false [cost] -input = 1.3 -output = 7.8 +input = 1.30 +output = 7.80 cache_read = 0.13 -cache_write = 1.625 [limit] context = 262_144 diff --git a/providers/xai/models/grok-4.3.toml b/providers/xai/models/grok-4.3.toml index 3270efd4f..bf45530e3 100644 --- a/providers/xai/models/grok-4.3.toml +++ b/providers/xai/models/grok-4.3.toml @@ -1,7 +1,7 @@ name = "Grok 4.3" family = "grok" -release_date = "2026-05-01" -last_updated = "2026-05-01" +release_date = "2026-05-07" +last_updated = "2026-05-07" attachment = true reasoning = true temperature = true @@ -11,12 +11,7 @@ open_weights = false [cost] input = 1.25 output = 2.50 -cache_read = 0.20 - -[cost.context_over_200k] -input = 2.50 -output = 5.00 -cache_read = 0.40 +cache_read = 0.3125 [limit] context = 1_000_000 From 91590874e7b6cd36137638e0760cff8611ce25af Mon Sep 17 00:00:00 2001 From: smakosh Date: Fri, 8 May 2026 17:43:07 +0200 Subject: [PATCH 3/3] Revert "fix(models): use canonical entries for qwen3.6-max-preview and grok-4.3" This reverts commit 70ac6fccdae12b018bb4d137d2224aa34132cdb7. --- providers/alibaba/models/qwen3.6-max-preview.toml | 10 ++++++---- providers/xai/models/grok-4.3.toml | 11 ++++++++--- 2 files changed, 14 insertions(+), 7 deletions(-) diff --git a/providers/alibaba/models/qwen3.6-max-preview.toml b/providers/alibaba/models/qwen3.6-max-preview.toml index e64bc15e6..09a6c5458 100644 --- a/providers/alibaba/models/qwen3.6-max-preview.toml +++ b/providers/alibaba/models/qwen3.6-max-preview.toml @@ -1,17 +1,19 @@ name = "Qwen3.6 Max Preview" family = "qwen" -release_date = "2026-05-07" -last_updated = "2026-05-07" +release_date = "2026-04-20" +last_updated = "2026-04-20" attachment = false reasoning = true temperature = true +knowledge = "2025-04" tool_call = true open_weights = false [cost] -input = 1.30 -output = 7.80 +input = 1.3 +output = 7.8 cache_read = 0.13 +cache_write = 1.625 [limit] context = 262_144 diff --git a/providers/xai/models/grok-4.3.toml b/providers/xai/models/grok-4.3.toml index bf45530e3..3270efd4f 100644 --- a/providers/xai/models/grok-4.3.toml +++ b/providers/xai/models/grok-4.3.toml @@ -1,7 +1,7 @@ name = "Grok 4.3" family = "grok" -release_date = "2026-05-07" -last_updated = "2026-05-07" +release_date = "2026-05-01" +last_updated = "2026-05-01" attachment = true reasoning = true temperature = true @@ -11,7 +11,12 @@ open_weights = false [cost] input = 1.25 output = 2.50 -cache_read = 0.3125 +cache_read = 0.20 + +[cost.context_over_200k] +input = 2.50 +output = 5.00 +cache_read = 0.40 [limit] context = 1_000_000