diff --git a/.gitignore b/.gitignore index 905957c45c..983940c711 100644 --- a/.gitignore +++ b/.gitignore @@ -128,3 +128,4 @@ MCP/.env MCP/node_modules Dashboard/public/sw.js .claude/settings.local.json +Common/.claude/settings.local.json diff --git a/Common/Server/Utils/LLM/LLMService.ts b/Common/Server/Utils/LLM/LLMService.ts index e59bbfec60..7a0c1d3715 100644 --- a/Common/Server/Utils/LLM/LLMService.ts +++ b/Common/Server/Utils/LLM/LLMService.ts @@ -16,6 +16,7 @@ export interface LLMMessage { export interface LLMCompletionRequest { messages: Array; temperature?: number; + maxTokens?: number; llmProviderConfig: LLMProviderConfig; } @@ -80,6 +81,7 @@ export default class LLMService { }; }), temperature: request.temperature ?? 0.7, + max_tokens: request.maxTokens || 4096, }, headers: { Authorization: `Bearer ${config.apiKey}`, @@ -153,6 +155,7 @@ export default class LLMService { model: modelName, messages: userMessages, temperature: request.temperature ?? 0.7, + max_tokens: request.maxTokens || 4096, }; if (systemMessage) { @@ -241,6 +244,7 @@ export default class LLMService { stream: false, options: { temperature: request.temperature ?? 0.7, + num_predict: request.maxTokens || 4096, }, }, headers: {