Unverified 提交 56949341 authored 作者: Will Chen's avatar Will Chen 提交者: GitHub

Lower o3/o4 mini max output tokens to maximize input tokens (#424)

上级 d69284e3
......@@ -44,7 +44,8 @@ export const MODEL_OPTIONS: Record<string, ModelOption[]> = {
name: "o3-mini",
displayName: "o3 mini",
description: "Reasoning model",
maxOutputTokens: 100_000,
// See o4-mini comment below for why we set this to 32k
maxOutputTokens: 32_000,
contextWindow: 200_000,
},
// https://platform.openai.com/docs/models/o4-mini
......@@ -52,7 +53,10 @@ export const MODEL_OPTIONS: Record<string, ModelOption[]> = {
name: "o4-mini",
displayName: "o4 mini",
description: "Reasoning model",
maxOutputTokens: 100_000,
// Technically the max output tokens is 100k, *however* if the user has a lot of input tokens,
// then setting a high max output token will cause the request to fail because
// the max output tokens is *included* in the context window limit.
maxOutputTokens: 32_000,
contextWindow: 200_000,
},
],
......
Markdown 格式
0%
您添加了 0 到此讨论。请谨慎行事。
请先完成此评论的编辑!
注册 或者 后发表评论