Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 4 additions & 4 deletions providers/wafer.ai/models/GLM-5.1.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "GLM-5.1"
family = "glm"
release_date = "2026-04-07"
last_updated = "2026-04-07"
last_updated = "2026-05-30"
knowledge = "2025-04"
attachment = false
reasoning = true
Expand All @@ -11,9 +11,9 @@ structured_output = true
open_weights = true

[cost]
input = 0
output = 0
cache_read = 0
input = 1.20
output = 3.60
cache_read = 0.12
cache_write = 0

[limit]
Expand Down
12 changes: 6 additions & 6 deletions providers/wafer.ai/models/Kimi-K2.6.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Kimi K2.6"
name = "Kimi-K2.6"
family = "kimi"
release_date = "2026-05-13"
last_updated = "2026-05-13"
last_updated = "2026-05-30"
knowledge = "2025-01"
attachment = true
reasoning = true
Expand All @@ -11,15 +11,15 @@ structured_output = true
open_weights = true

[cost]
input = 1.10
output = 4.80
cache_read = 0.11
input = 0.88
output = 3.84
cache_read = 0.09
cache_write = 0

[limit]
context = 262_144
output = 65_536

[modalities]
input = ["text", "image"]
input = ["text", "image", "video"]
output = ["text"]
10 changes: 5 additions & 5 deletions providers/wafer.ai/models/Qwen3.5-397B-A17B.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3.5 397B A17B"
name = "Qwen3.5-397B-A17B"
family = "qwen"
release_date = "2026-02-16"
last_updated = "2026-02-16"
last_updated = "2026-05-30"
knowledge = "2025-04"
attachment = true
reasoning = true
Expand All @@ -11,9 +11,9 @@ structured_output = true
open_weights = true

[cost]
input = 0
output = 0
cache_read = 0
input = 0.48
output = 2.88
cache_read = 0.05
cache_write = 0

[limit]
Expand Down
13 changes: 7 additions & 6 deletions providers/wafer.ai/models/Qwen3.6-35B-A3B.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3.6 35B A3B"
name = "Qwen3.6-35B-A3B"
family = "qwen"
release_date = "2026-05-11"
last_updated = "2026-05-11"
last_updated = "2026-05-30"
knowledge = "2025-04"
attachment = true
reasoning = true
Expand All @@ -11,14 +11,15 @@ structured_output = true
open_weights = true

[cost]
input = 0.19
output = 1.25
input = 0.15
output = 1.00
cache_read = 0.02
cache_write = 0

[limit]
context = 32_768
output = 16_384
context = 256_000
input = 229_376
output = 65_536

[modalities]
input = ["text", "image", "video"]
Expand Down
28 changes: 28 additions & 0 deletions providers/wafer.ai/models/deepseek-v4-flash.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
# Model metadata for DeepSeek V4 Flash as listed under the wafer.ai provider.
name = "DeepSeek V4 Flash"
family = "deepseek-flash"
# Dates are kept as quoted YYYY-MM-DD strings, matching the other model files
# for this provider.
release_date = "2026-04-24"
last_updated = "2026-05-30"
# Year-month string; presumably the training-data cutoff. TODO confirm against
# the schema.
knowledge = "2025-05"
# Capability flags.
attachment = false
reasoning = true
temperature = true
tool_call = true
structured_output = true
open_weights = true

# NOTE(review): units are not stated in this file; presumably USD per one
# million tokens. Confirm against the schema before relying on these numbers.
[cost]
input = 0.14
output = 0.28
cache_read = 0.01
cache_write = 0

# Presumably token counts. TODO confirm.
[limit]
context = 1_000_000
output = 384_000

# Text is the only listed modality in either direction.
[modalities]
input = ["text"]
output = ["text"]

# NOTE(review): presumably names the response field that carries interleaved
# reasoning output. Verify against the consumer of this table.
[interleaved]
field = "reasoning_content"
28 changes: 28 additions & 0 deletions providers/wafer.ai/models/deepseek-v4-pro.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,28 @@
# Model metadata for DeepSeek V4 Pro as listed under the wafer.ai provider.
name = "DeepSeek V4 Pro"
family = "deepseek-thinking"
# Dates are kept as quoted YYYY-MM-DD strings, matching the other model files
# for this provider.
release_date = "2026-04-24"
last_updated = "2026-05-30"
# Year-month string; presumably the training-data cutoff. TODO confirm against
# the schema.
knowledge = "2025-05"
# Capability flags.
attachment = false
reasoning = true
temperature = true
tool_call = true
structured_output = true
open_weights = true

# NOTE(review): units are not stated in this file; presumably USD per one
# million tokens. Confirm against the schema before relying on these numbers.
[cost]
input = 1.74
output = 3.48
cache_read = 0.02
cache_write = 0

# Presumably token counts. TODO confirm.
[limit]
context = 1_000_000
output = 384_000

# Text is the only listed modality in either direction.
[modalities]
input = ["text"]
output = ["text"]

# NOTE(review): presumably names the response field that carries interleaved
# reasoning output. Verify against the consumer of this table.
[interleaved]
field = "reasoning_content"
24 changes: 24 additions & 0 deletions providers/wafer.ai/models/qwen3.7-max.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,24 @@
# Model metadata for Qwen3.7-Max as listed under the wafer.ai provider.
name = "Qwen3.7-Max"
# NOTE(review): the other Qwen model files for this provider use
# family = "qwen"; confirm that a model-specific family value is intended here.
family = "qwen3.7-max"
# Dates are kept as quoted YYYY-MM-DD strings, matching the other model files
# for this provider.
release_date = "2026-05-21"
last_updated = "2026-05-30"
# NOTE(review): there is no `knowledge` key here, although the other model
# files for this provider set one. Confirm whether the omission is deliberate.
# Capability flags.
attachment = false
reasoning = true
temperature = true
tool_call = true
structured_output = true
open_weights = false

# NOTE(review): units are not stated in this file; presumably USD per one
# million tokens. Confirm against the schema before relying on these numbers.
[cost]
input = 5.00
output = 15.00
cache_read = 0.50
cache_write = 0

# Presumably token counts. TODO confirm.
[limit]
context = 256_000
output = 65_536

# Text is the only listed modality in either direction.
[modalities]
input = ["text"]
output = ["text"]
Loading