Skip to content

Commit 59831a9

Browse files
authored
Merge pull request #1399 from dpuyosa/venice-model-updates-2026-04-09
Venice: Update model configs with refreshed pricing and limits
2 parents c7552d0 + c3a2b1a commit 59831a9

File tree

6 files changed: +28 additions, -24 deletions (lines changed)

6 files changed

+28
-24
lines changed

providers/venice/models/google.gemma-4-26b-a4b-it.toml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@ tool_call = true
66
structured_output = true
77
temperature = true
88
release_date = "2026-04-02"
9-
last_updated = "2026-04-04"
9+
last_updated = "2026-04-09"
1010
open_weights = true
1111

1212
[cost]
@@ -15,7 +15,7 @@ output = 0.5
1515

1616
[limit]
1717
context = 256_000
18-
output = 12_288
18+
output = 8_192
1919

2020
[modalities]
2121
input = ["text", "image", "video"]

providers/venice/models/google.gemma-4-31b-it.toml

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@ tool_call = true
66
structured_output = true
77
temperature = true
88
release_date = "2026-04-03"
9-
last_updated = "2026-04-04"
9+
last_updated = "2026-04-09"
1010
open_weights = true
1111

1212
[cost]
@@ -15,7 +15,7 @@ output = 0.5
1515

1616
[limit]
1717
context = 256_000
18-
output = 12_288
18+
output = 8_192
1919

2020
[modalities]
2121
input = ["text", "image", "video"]

providers/venice/models/grok-4-20-beta.toml

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -6,18 +6,18 @@ tool_call = true
66
structured_output = true
77
temperature = true
88
release_date = "2026-03-12"
9-
last_updated = "2026-03-16"
9+
last_updated = "2026-04-09"
1010
open_weights = false
1111

1212
[cost]
13-
input = 2.5
14-
output = 7.5
15-
cache_read = 0.25
13+
input = 2.27
14+
output = 6.8
15+
cache_read = 0.23
1616

1717
[cost.context_over_200k]
18-
input = 5
19-
output = 15
20-
cache_read = 0.25
18+
input = 4.53
19+
output = 13.6
20+
cache_read = 0.23
2121

2222
[limit]
2323
context = 2_000_000

providers/venice/models/grok-4-20-multi-agent-beta.toml

Lines changed: 7 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -6,18 +6,18 @@ tool_call = false
66
structured_output = true
77
temperature = true
88
release_date = "2026-03-12"
9-
last_updated = "2026-03-16"
9+
last_updated = "2026-04-09"
1010
open_weights = false
1111

1212
[cost]
13-
input = 2.5
14-
output = 7.5
15-
cache_read = 0.25
13+
input = 2.27
14+
output = 6.8
15+
cache_read = 0.23
1616

1717
[cost.context_over_200k]
18-
input = 5
19-
output = 15
20-
cache_read = 0.25
18+
input = 4.53
19+
output = 13.6
20+
cache_read = 0.23
2121

2222
[limit]
2323
context = 2_000_000

providers/venice/models/grok-41-fast.toml

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -7,13 +7,13 @@ structured_output = true
77
temperature = true
88
knowledge = "2025-07"
99
release_date = "2025-12-01"
10-
last_updated = "2026-03-12"
10+
last_updated = "2026-04-09"
1111
open_weights = false
1212

1313
[cost]
14-
input = 0.25
15-
output = 0.625
16-
cache_read = 0.0625
14+
input = 0.23
15+
output = 0.57
16+
cache_read = 0.06
1717

1818
[limit]
1919
context = 1_000_000

providers/venice/models/qwen-3-6-plus.toml

Lines changed: 6 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,12 +1,12 @@
1-
name = "Qwen 3.6 Plus"
1+
name = "Qwen 3.6 Plus Uncensored"
22
family = "qwen"
33
attachment = true
44
reasoning = true
55
tool_call = true
66
structured_output = true
77
temperature = true
88
release_date = "2026-04-06"
9-
last_updated = "2026-04-07"
9+
last_updated = "2026-04-09"
1010
open_weights = false
1111

1212
[cost]
@@ -15,6 +15,10 @@ output = 3.75
1515
cache_read = 0.0625
1616
cache_write = 0.78
1717

18+
[cost.context_over_200k]
19+
input = 2.5
20+
output = 7.5
21+
1822
[limit]
1923
context = 1_000_000
2024
output = 65_536

0 commit comments

Comments
 (0)