ollama: Add max tokens for qwen2.5-coder (#18290)

This commit is contained in:
John Cummings 2024-09-24 11:17:17 -06:00 committed by GitHub
parent fd07fef4db
commit 8a7ef4db59
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@@ -82,7 +82,8 @@ fn get_max_tokens(name: &str) -> usize {
"llama3" | "gemma2" | "gemma" | "codegemma" | "starcoder" | "aya" => 8192,
"codellama" | "starcoder2" => 16384,
"mistral" | "codestral" | "mixstral" | "llava" | "qwen2" | "dolphin-mixtral" => 32768,
"llama3.1" | "phi3" | "phi3.5" | "command-r" | "deepseek-coder-v2" | "yi-coder" => 128000,
"llama3.1" | "phi3" | "phi3.5" | "command-r" | "deepseek-coder-v2" | "yi-coder"
| "qwen2.5-coder" => 128000,
_ => DEFAULT_TOKENS,
}
.clamp(1, MAXIMUM_TOKENS)