feat(llm): add deepseek reasoning flag and rename GPU layers flag

Update the LLM server command construction to always pass a new `--reasoning-format deepseek` argument in the base argument string, explicitly selecting the DeepSeek reasoning format. Replace the short `-ngl` flag with the more descriptive `--n-gpu-layers` to improve readability and consistency with the other long-form CLI options. This change makes the reasoning format explicit for models that require it and clarifies the GPU layer configuration.
This commit is contained in:
Rodrigo Rodriguez (Pragmatismo) 2025-11-07 17:16:58 -03:00
parent 312503ae66
commit 5379e21bfe

View file

@@ -204,7 +204,7 @@ pub async fn start_llm_server(
// Build command arguments dynamically // Build command arguments dynamically
let mut args = format!( let mut args = format!(
"-m {} --host 0.0.0.0 --port {} --top_p 0.95 --temp 0.6 --repeat-penalty 1.2 -ngl {}", "-m {} --host 0.0.0.0 --port {} --reasoning-format deepseek --top_p 0.95 --temp 0.6 --repeat-penalty 1.2 --n-gpu-layers {}",
model_path, port, gpu_layers model_path, port, gpu_layers
); );
if !reasoning_format.is_empty() { if !reasoning_format.is_empty() {