mirror of
https://github.com/zadam/trilium.git
synced 2026-06-26 19:21:42 +02:00
fix(llm): thinking budget mismatch
This commit is contained in:
@@ -11,6 +11,8 @@ export interface ChatConfig {
|
||||
systemPrompt?: string;
|
||||
enableWebSearch?: boolean;
|
||||
enableExtendedThinking?: boolean;
|
||||
+ /** Token budget for extended thinking (default: 10000) */
|
||||
+ thinkingBudget?: number;
|
||||
}
|
||||
|
||||
export interface Citation {
|
||||
|
||||
@@ -52,9 +52,12 @@ export class AnthropicProvider implements LlmProvider {
|
||||
|
||||
// Enable extended thinking for deeper reasoning
|
||||
if (config.enableExtendedThinking) {
|
||||
+ const thinkingBudget = config.thinkingBudget || 10000;
|
||||
+ // max_tokens must be greater than thinking budget
|
||||
+ streamParams.max_tokens = Math.max(streamParams.max_tokens, thinkingBudget + 4000);
|
||||
(streamParams as any).thinking = {
|
||||
type: "enabled",
|
||||
- budget_tokens: 10000 // Allow up to 10k tokens for thinking
|
||||
+ budget_tokens: thinkingBudget
|
||||
};
|
||||
}
|
||||
|
||||
|
||||
@@ -29,6 +29,8 @@ export interface LlmProviderConfig {
|
||||
enableWebSearch?: boolean;
|
||||
/** Enable extended thinking for deeper reasoning */
|
||||
enableExtendedThinking?: boolean;
|
||||
+ /** Token budget for extended thinking (default: 10000) */
|
||||
+ thinkingBudget?: number;
|
||||
}
|
||||
|
||||
export interface LlmProvider {
|
||||
|
||||
Reference in New Issue
Block a user