feat(llm): add deepseek reasoning flag and rename GPU layers
Update the LLM server command construction to include a new `--reasoning-format deepseek` argument, enabling explicit selection of the DeepSeek reasoning format. Replace the short `-ngl` flag with the more descriptive `--n-gpu-layers` to improve readability and consistency with other CLI options. This change enhances configurability for models requiring specific reasoning formats and clarifies GPU layer configuration.
This commit is contained in:
parent
312503ae66
commit
5379e21bfe
1 changed files with 1 additions and 1 deletions
|
|
@ -204,7 +204,7 @@ pub async fn start_llm_server(
|
||||||
|
|
||||||
// Build command arguments dynamically
|
// Build command arguments dynamically
|
||||||
let mut args = format!(
|
let mut args = format!(
|
||||||
"-m {} --host 0.0.0.0 --port {} --top_p 0.95 --temp 0.6 --repeat-penalty 1.2 -ngl {}",
|
"-m {} --host 0.0.0.0 --port {} --reasoning-format deepseek --top_p 0.95 --temp 0.6 --repeat-penalty 1.2 --n-gpu-layers {}",
|
||||||
model_path, port, gpu_layers
|
model_path, port, gpu_layers
|
||||||
);
|
);
|
||||||
if !reasoning_format.is_empty() {
|
if !reasoning_format.is_empty() {
|
||||||
|
|
|
||||||
Loading…
Add table
Reference in a new issue