fix: maxCompletionTokens Implementation for All Providers (#1938)

* Update LLM providers and constants

- Updated constants in app/lib/.server/llm/constants.ts
- Modified stream-text functionality in app/lib/.server/llm/stream-text.ts
- Updated Anthropic provider in app/lib/modules/llm/providers/anthropic.ts
- Modified GitHub provider in app/lib/modules/llm/providers/github.ts
- Updated Google provider in app/lib/modules/llm/providers/google.ts
- Modified OpenAI provider in app/lib/modules/llm/providers/openai.ts
- Updated LLM types in app/lib/modules/llm/types.ts
- Modified API route in app/routes/api.llmcall.ts

* Fix maxCompletionTokens Implementation for All Providers

 - Cohere: Added maxCompletionTokens: 4000 to all 10 static models
  - DeepSeek: Added maxCompletionTokens: 8192 to all 3 static models
  - Groq: Added maxCompletionTokens: 8192 to both static models
  - Mistral: Added maxCompletionTokens: 8192 to all 9 static models
  - Together: Added maxCompletionTokens: 8192 to both static models

  - Groq: Fixed getDynamicModels to include maxCompletionTokens: 8192
  - Together: Fixed getDynamicModels to include maxCompletionTokens: 8192
  - OpenAI: Fixed getDynamicModels with proper logic for reasoning models (o1: 16384, o1-mini: 8192) and standard models
This commit is contained in:
Stijnus
2025-08-29 23:13:58 +02:00
committed by GitHub
parent 38c13494c2
commit ff8b0d7af1
6 changed files with 169 additions and 23 deletions

View File

@@ -22,6 +22,7 @@ export default class TogetherProvider extends BaseProvider {
label: 'Llama 3.2 90B Vision',
provider: 'Together',
maxTokenAllowed: 128000,
maxCompletionTokens: 8192,
},
// Mixtral 8x7B: 32k context, strong performance
@@ -30,6 +31,7 @@ export default class TogetherProvider extends BaseProvider {
label: 'Mixtral 8x7B Instruct',
provider: 'Together',
maxTokenAllowed: 32000,
maxCompletionTokens: 8192,
},
];
@@ -67,6 +69,7 @@ export default class TogetherProvider extends BaseProvider {
label: `${m.display_name} - in:$${m.pricing.input.toFixed(2)} out:$${m.pricing.output.toFixed(2)} - context ${Math.floor(m.context_length / 1000)}k`,
provider: this.name,
maxTokenAllowed: 8000,
maxCompletionTokens: 8192,
}));
}