Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
288 changes: 261 additions & 27 deletions packages/core/script/generate-wandb.ts

Large diffs are not rendered by default.

5 changes: 3 additions & 2 deletions providers/wandb/models/MiniMaxAI/MiniMax-M2.5.toml
Original file line number Diff line number Diff line change
@@ -1,9 +1,9 @@
name = "MiniMax M2.5"
family = "minimax"
release_date = "2026-02-12"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
reasoning = true
structured_output = true
temperature = true
tool_call = true
Expand All @@ -12,6 +12,7 @@ open_weights = true
[cost]
input = 0.3
output = 1.2
cache_read = 0.3

[limit]
context = 196_608
Expand Down
3 changes: 2 additions & 1 deletion providers/wandb/models/OpenPipe/Qwen3-14B-Instruct.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "OpenPipe Qwen3 14B Instruct"
family = "qwen"
release_date = "2025-04-29"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -12,6 +12,7 @@ open_weights = true
[cost]
input = 0.05
output = 0.22
cache_read = 0.05

[limit]
context = 32_768
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3 235B A22B Instruct 2507"
family = "qwen"
release_date = "2025-04-28"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -13,6 +13,7 @@ open_weights = true
[cost]
input = 0.1
output = 0.1
cache_read = 0.1

[limit]
context = 262_144
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3-235B-A22B-Thinking-2507"
family = "qwen"
release_date = "2025-07-25"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = true
structured_output = true
Expand All @@ -13,6 +13,7 @@ open_weights = true
[cost]
input = 0.1
output = 0.1
cache_read = 0.1

[limit]
context = 262_144
Expand Down
3 changes: 2 additions & 1 deletion providers/wandb/models/Qwen/Qwen3-30B-A3B-Instruct-2507.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3 30B A3B Instruct 2507"
family = "qwen"
release_date = "2025-07-29"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -12,6 +12,7 @@ open_weights = true
[cost]
input = 0.1
output = 0.3
cache_read = 0.1

[limit]
context = 262_144
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3-Coder-480B-A35B-Instruct"
family = "qwen"
release_date = "2025-07-23"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -13,6 +13,7 @@ open_weights = true
[cost]
input = 1
output = 1.5
cache_read = 1

[limit]
context = 262_144
Expand Down
23 changes: 23 additions & 0 deletions providers/wandb/models/Qwen/Qwen3.5-27B.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "Qwen3.5 27B"
family = "qwen3.5"
release_date = "2026-02-24"
last_updated = "2026-05-19"
attachment = true
reasoning = true
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 0.39
output = 3.12
cache_read = 0.08

[limit]
context = 262_144
output = 262_144

[modalities]
input = ["text", "image"]
output = ["text"]
23 changes: 23 additions & 0 deletions providers/wandb/models/Qwen/Qwen3.5-35B-A3B.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "Qwen3.5 35B A3B"
family = "qwen3.5"
release_date = "2026-02-24"
last_updated = "2026-05-19"
attachment = true
reasoning = true
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 0.25
output = 1.25
cache_read = 0.25

[limit]
context = 262_144
output = 262_144

[modalities]
input = ["text", "image"]
output = ["text"]
23 changes: 23 additions & 0 deletions providers/wandb/models/Qwen/Qwen3.6-27B.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "Qwen3.6 27B"
family = "qwen3.6"
release_date = "2026-04-22"
last_updated = "2026-05-19"
attachment = true
reasoning = true
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 0.6
output = 3.6
cache_read = 0.12

[limit]
context = 262_144
output = 262_144

[modalities]
input = ["text", "image"]
output = ["text"]
23 changes: 23 additions & 0 deletions providers/wandb/models/Qwen/Qwen3.6-35B-A3B.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "Qwen3.6 35B A3B"
family = "qwen3.6"
release_date = "2026-04-15"
last_updated = "2026-05-19"
attachment = true
reasoning = true
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 0.25
output = 1.25
cache_read = 0.25

[limit]
context = 262_144
output = 262_144

[modalities]
input = ["text", "image"]
output = ["text"]
3 changes: 2 additions & 1 deletion providers/wandb/models/deepseek-ai/DeepSeek-V3.1.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "DeepSeek V3.1"
family = "deepseek"
release_date = "2025-08-21"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -12,6 +12,7 @@ open_weights = true
[cost]
input = 0.55
output = 1.65
cache_read = 0.55

[limit]
context = 161_000
Expand Down
23 changes: 23 additions & 0 deletions providers/wandb/models/deepseek-ai/DeepSeek-V4-Flash.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "DeepSeek V4 Flash"
family = "deepseek"
release_date = "2026-04-24"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 0.14
output = 0.28
cache_read = 0.07

[limit]
context = 1_048_576
output = 1_048_576

[modalities]
input = ["text"]
output = ["text"]
23 changes: 23 additions & 0 deletions providers/wandb/models/deepseek-ai/DeepSeek-V4-Pro.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "DeepSeek V4 Pro"
family = "deepseek"
release_date = "2026-04-24"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 1.74
output = 3.48
cache_read = 0.14

[limit]
context = 1_048_576
output = 1_048_576

[modalities]
input = ["text"]
output = ["text"]
23 changes: 23 additions & 0 deletions providers/wandb/models/google/gemma-4-31B-it.toml
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
name = "Gemma 4 31B"
family = "gemma"
release_date = "2026-04-02"
last_updated = "2026-05-19"
attachment = true
reasoning = true
structured_output = true
temperature = true
tool_call = true
open_weights = true

[cost]
input = 0.3
output = 1.25
cache_read = 0.3

[limit]
context = 262_144
output = 262_144

[modalities]
input = ["text", "image"]
output = ["text"]
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "GLM 5"
family = "glm"
release_date = "2026-02-11"
last_updated = "2026-03-12"
name = "Granite 4.1 8B"
family = "granite"
release_date = "2026-04-29"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -10,12 +10,13 @@ tool_call = true
open_weights = true

[cost]
input = 1
output = 3.2
input = 0.05
output = 0.1
cache_read = 0.05

[limit]
context = 200_000
output = 200_000
context = 131_072
output = 131_072

[modalities]
input = ["text"]
Expand Down
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Llama 3.1 70B"
family = "llama"
release_date = "2024-07-23"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = false
structured_output = true
Expand All @@ -12,6 +12,7 @@ open_weights = true
[cost]
input = 0.8
output = 0.8
cache_read = 0.8

[limit]
context = 128_000
Expand Down
5 changes: 3 additions & 2 deletions providers/wandb/models/meta-llama/Llama-3.1-8B-Instruct.toml
Original file line number Diff line number Diff line change
@@ -1,9 +1,9 @@
name = "Meta-Llama-3.1-8B-Instruct"
family = "llama"
release_date = "2024-07-23"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = true
reasoning = false
structured_output = true
temperature = true
tool_call = true
Expand All @@ -13,6 +13,7 @@ open_weights = true
[cost]
input = 0.22
output = 0.22
cache_read = 0.22

[limit]
context = 128_000
Expand Down
5 changes: 3 additions & 2 deletions providers/wandb/models/meta-llama/Llama-3.3-70B-Instruct.toml
Original file line number Diff line number Diff line change
@@ -1,9 +1,9 @@
name = "Llama-3.3-70B-Instruct"
family = "llama"
release_date = "2024-12-06"
last_updated = "2026-03-12"
last_updated = "2026-05-19"
attachment = false
reasoning = true
reasoning = false
structured_output = true
temperature = true
tool_call = true
Expand All @@ -13,6 +13,7 @@ open_weights = true
[cost]
input = 0.71
output = 0.71
cache_read = 0.71

[limit]
context = 128_000
Expand Down
Original file line number Diff line number Diff line change
@@ -1,13 +1,13 @@
name = "Llama 4 Scout 17B 16E Instruct"
family = "llama"
release_date = "2025-01-31"
last_updated = "2026-03-12"
attachment = false
reasoning = true
release_date = "2025-04-05"
last_updated = "2026-05-19"
attachment = true
reasoning = false
structured_output = true
temperature = true
tool_call = true
knowledge = "2024-12"
knowledge = "2024-08"
open_weights = true

[cost]
Expand Down
Loading