Skip to content

Commit ada7411

Browse files
authored
Tweaks to baseten model definitions (#9866)
1 parent 721b02e commit ada7411

File tree

1 file changed

+12
-11
lines changed

1 file changed

+12
-11
lines changed

packages/types/src/providers/baseten.ts

Lines changed: 12 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -5,7 +5,7 @@ import type { ModelInfo } from "../model.js"
55

66
export const basetenModels = {
77
"moonshotai/Kimi-K2-Thinking": {
8-
maxTokens: 163_800,
8+
maxTokens: 16_384,
99
contextWindow: 262_000,
1010
supportsImages: false,
1111
supportsPromptCache: false,
@@ -17,7 +17,7 @@ export const basetenModels = {
1717
description: "Kimi K2 Thinking - A model with enhanced reasoning capabilities from Kimi K2",
1818
},
1919
"zai-org/GLM-4.6": {
20-
maxTokens: 200_000,
20+
maxTokens: 16_384,
2121
contextWindow: 200_000,
2222
supportsImages: false,
2323
supportsPromptCache: false,
@@ -29,7 +29,7 @@ export const basetenModels = {
2929
description: "Frontier open model with advanced agentic, reasoning and coding capabilities",
3030
},
3131
"deepseek-ai/DeepSeek-R1": {
32-
maxTokens: 131_072,
32+
maxTokens: 16_384,
3333
contextWindow: 163_840,
3434
supportsImages: false,
3535
supportsPromptCache: false,
@@ -40,7 +40,7 @@ export const basetenModels = {
4040
description: "DeepSeek's first-generation reasoning model",
4141
},
4242
"deepseek-ai/DeepSeek-R1-0528": {
43-
maxTokens: 131_072,
43+
maxTokens: 16_384,
4444
contextWindow: 163_840,
4545
supportsImages: false,
4646
supportsPromptCache: false,
@@ -51,7 +51,7 @@ export const basetenModels = {
5151
description: "The latest revision of DeepSeek's first-generation reasoning model",
5252
},
5353
"deepseek-ai/DeepSeek-V3-0324": {
54-
maxTokens: 131_072,
54+
maxTokens: 16_384,
5555
contextWindow: 163_840,
5656
supportsImages: false,
5757
supportsPromptCache: false,
@@ -62,7 +62,7 @@ export const basetenModels = {
6262
description: "Fast general-purpose LLM with enhanced reasoning capabilities",
6363
},
6464
"deepseek-ai/DeepSeek-V3.1": {
65-
maxTokens: 131_072,
65+
maxTokens: 16_384,
6666
contextWindow: 163_840,
6767
supportsImages: false,
6868
supportsPromptCache: false,
@@ -74,10 +74,11 @@ export const basetenModels = {
7474
"Extremely capable general-purpose LLM with hybrid reasoning capabilities and advanced tool calling",
7575
},
7676
"deepseek-ai/DeepSeek-V3.2": {
77-
maxTokens: 131_072,
77+
maxTokens: 16_384,
7878
contextWindow: 163_840,
7979
supportsImages: false,
8080
supportsPromptCache: false,
81+
supportsNativeTools: true,
8182
inputPrice: 0.3,
8283
outputPrice: 0.45,
8384
cacheWritesPrice: 0,
@@ -86,7 +87,7 @@ export const basetenModels = {
8687
"DeepSeek's hybrid reasoning model with efficient long context scaling with GPT-5 level performance",
8788
},
8889
"Qwen/Qwen3-235B-A22B-Instruct-2507": {
89-
maxTokens: 262_144,
90+
maxTokens: 16_384,
9091
contextWindow: 262_144,
9192
supportsImages: false,
9293
supportsPromptCache: false,
@@ -97,7 +98,7 @@ export const basetenModels = {
9798
description: "Mixture-of-experts LLM with math and reasoning capabilities",
9899
},
99100
"Qwen/Qwen3-Coder-480B-A35B-Instruct": {
100-
maxTokens: 262_144,
101+
maxTokens: 16_384,
101102
contextWindow: 262_144,
102103
supportsImages: false,
103104
supportsPromptCache: false,
@@ -108,7 +109,7 @@ export const basetenModels = {
108109
description: "Mixture-of-experts LLM with advanced coding and reasoning capabilities",
109110
},
110111
"openai/gpt-oss-120b": {
111-
maxTokens: 128_072,
112+
maxTokens: 16_384,
112113
contextWindow: 128_072,
113114
supportsImages: false,
114115
supportsPromptCache: false,
@@ -120,7 +121,7 @@ export const basetenModels = {
120121
description: "Extremely capable general-purpose LLM with strong, controllable reasoning capabilities",
121122
},
122123
"moonshotai/Kimi-K2-Instruct-0905": {
123-
maxTokens: 168_000,
124+
maxTokens: 16_384,
124125
contextWindow: 262_000,
125126
supportsImages: false,
126127
supportsPromptCache: false,

0 commit comments

Comments
 (0)