From 8a7ef4db59668f9dda841a9550abd1cc78651fa3 Mon Sep 17 00:00:00 2001
From: John Cummings
Date: Tue, 24 Sep 2024 11:17:17 -0600
Subject: [PATCH] ollama: Add max tokens for qwen2.5-coder (#18290)

---
 crates/ollama/src/ollama.rs | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/crates/ollama/src/ollama.rs b/crates/ollama/src/ollama.rs
index 51c48290488147800ce6d989593a13995396f309..e592bfa17717d36c102f654d2573ace3947053b3 100644
--- a/crates/ollama/src/ollama.rs
+++ b/crates/ollama/src/ollama.rs
@@ -82,7 +82,8 @@ fn get_max_tokens(name: &str) -> usize {
         "llama3" | "gemma2" | "gemma" | "codegemma" | "starcoder" | "aya" => 8192,
         "codellama" | "starcoder2" => 16384,
         "mistral" | "codestral" | "mixstral" | "llava" | "qwen2" | "dolphin-mixtral" => 32768,
-        "llama3.1" | "phi3" | "phi3.5" | "command-r" | "deepseek-coder-v2" | "yi-coder" => 128000,
+        "llama3.1" | "phi3" | "phi3.5" | "command-r" | "deepseek-coder-v2" | "yi-coder"
+        | "qwen2.5-coder" => 128000,
         _ => DEFAULT_TOKENS,
     }
     .clamp(1, MAXIMUM_TOKENS)