Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
19 changes: 7 additions & 12 deletions providers/chutes/models/MiniMaxAI/MiniMax-M2.1-TEE.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "MiniMax M2.1 TEE"
family = "minimaxai"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = true
temperature = true
Expand All @@ -10,21 +10,16 @@ structured_output = true
open_weights = true

[cost]
input = 0.3
output = 1.2
reasoning = 1.8
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0
input = 0.30
output = 1.20

[limit]
context = 196608
output = 65536
context = 196_608
output = 65_536

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]

[interleaved]
field = "reasoning_content"
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "DeepHermes 3 Mistral 24B Preview"
family = "nousresearch"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
Expand All @@ -11,16 +11,12 @@ open_weights = true

[cost]
input = 0.02
output = 0.1
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0
output = 0.10

[limit]
context = 32768
output = 32768
context = 32_768
output = 32_768

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]
15 changes: 5 additions & 10 deletions providers/chutes/models/NousResearch/Hermes-4-14B.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Hermes 4 14B"
family = "nousresearch"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = true
temperature = true
Expand All @@ -12,19 +12,14 @@ open_weights = true
[cost]
input = 0.01
output = 0.05
reasoning = 0.075
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 40960
output = 40960
context = 40_960
output = 40_960

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]

[interleaved]
field = "reasoning_content"
15 changes: 7 additions & 8 deletions providers/chutes/models/NousResearch/Hermes-4-405B-FP8-TEE.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Hermes 4 405B FP8 TEE"
family = "nousresearch"
release_date = "2025-12-29"
last_updated = "2025-01-06"
last_updated = "2026-01-10"
attachment = false
reasoning = true
temperature = true
Expand All @@ -10,17 +10,16 @@ structured_output = true
open_weights = true

[cost]
input = 0.3
output = 1.2
reasoning = 1.8
input = 0.30
output = 1.20

[limit]
context = 131072
output = 65536
context = 131_072
output = 65_536

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]

[interleaved]
field = "reasoning_content"
15 changes: 5 additions & 10 deletions providers/chutes/models/NousResearch/Hermes-4-70B.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Hermes 4 70B"
family = "nousresearch"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = true
temperature = true
Expand All @@ -12,19 +12,14 @@ open_weights = true
[cost]
input = 0.11
output = 0.38
reasoning = 0.57
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 131072
output = 131072
context = 131_072
output = 131_072

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]

[interleaved]
field = "reasoning_content"
16 changes: 6 additions & 10 deletions providers/chutes/models/NousResearch/Hermes-4.3-36B.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Hermes 4.3 36B"
family = "nousresearch"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
Expand All @@ -10,17 +10,13 @@ structured_output = false
open_weights = true

[cost]
input = 0.1
input = 0.10
output = 0.39
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 524288
output = 524288
context = 32_768
output = 8_192

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]
13 changes: 6 additions & 7 deletions providers/chutes/models/OpenGVLab/InternVL3-78B-TEE.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "InternVL3 78B TEE"
family = "opengvlab"
release_date = "2025-01-06"
last_updated = "2025-01-06"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
Expand All @@ -10,14 +10,13 @@ structured_output = true
open_weights = true

[cost]
input = 0.1
input = 0.10
output = 0.39

[limit]
context = 32768
output = 32768
context = 32_768
output = 32_768

[modalities]
input = ['text', 'image']
output = ['text']

input = ["text", "image"]
output = ["text"]
14 changes: 5 additions & 9 deletions providers/chutes/models/Qwen/Qwen2.5-72B-Instruct.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen2.5 72B Instruct"
family = "qwen"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
Expand All @@ -12,15 +12,11 @@ open_weights = true
[cost]
input = 0.13
output = 0.52
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 32768
output = 32768
context = 32_768
output = 32_768

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]
14 changes: 5 additions & 9 deletions providers/chutes/models/Qwen/Qwen2.5-Coder-32B-Instruct.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen2.5 Coder 32B Instruct"
family = "qwen"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
Expand All @@ -12,15 +12,11 @@ open_weights = true
[cost]
input = 0.03
output = 0.11
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 32768
output = 32768
context = 32_768
output = 32_768

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]
14 changes: 5 additions & 9 deletions providers/chutes/models/Qwen/Qwen2.5-VL-32B-Instruct.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen2.5 VL 32B Instruct"
family = "qwen"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
Expand All @@ -12,15 +12,11 @@ open_weights = true
[cost]
input = 0.05
output = 0.22
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 16384
output = 16384
context = 16_384
output = 16_384

[modalities]
input = ['text', 'image']
output = ['text']
input = ["text", "image"]
output = ["text"]
18 changes: 7 additions & 11 deletions providers/chutes/models/Qwen/Qwen2.5-VL-72B-Instruct-TEE.toml
Original file line number Diff line number Diff line change
@@ -1,26 +1,22 @@
name = "Qwen2.5 VL 72B Instruct TEE"
family = "qwen"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = false
temperature = true
tool_call = false
structured_output = false
structured_output = true
open_weights = true

[cost]
input = 0.15
output = 0.6
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0
output = 0.60

[limit]
context = 40960
output = 40960
context = 32_768
output = 32_768

[modalities]
input = ['text', 'image']
output = ['text']
input = ["text", "image"]
output = ["text"]
15 changes: 5 additions & 10 deletions providers/chutes/models/Qwen/Qwen3-14B.toml
Original file line number Diff line number Diff line change
@@ -1,7 +1,7 @@
name = "Qwen3 14B"
family = "qwen"
release_date = "2025-12-29"
last_updated = "2025-12-29"
last_updated = "2026-01-10"
attachment = false
reasoning = true
temperature = true
Expand All @@ -12,19 +12,14 @@ open_weights = true
[cost]
input = 0.05
output = 0.22
reasoning = 0.33
cache_read = 0.0
cache_write = 0.0
input_audio = 0.0
output_audio = 0.0

[limit]
context = 40960
output = 40960
context = 40_960
output = 40_960

[modalities]
input = ['text']
output = ['text']
input = ["text"]
output = ["text"]

[interleaved]
field = "reasoning_content"
Loading