Add comment about batch_size reduction for llama-server stability

2026-04-12 09:59:49 -03:00 · 2026-04-12 09:59:49 -03:00 · 694fb91efe
commit 694fb91efe
parent d3673e1f34
1 changed file with 1 addition and 1 deletion
--- a/src/core/kb/embedding_generator.rs
+++ b/src/core/kb/embedding_generator.rs
@@ -43,7 +43,7 @@ impl Default for EmbeddingConfig {
            embedding_model: "BAAI/bge-multilingual-gemma2".to_string(),
            embedding_key: None,
            dimensions: 2048,
-            batch_size: 2,
+            batch_size: 2, // Reduced from 16 to prevent llama-server crash
            timeout_seconds: 60,
            max_concurrent_requests: 1,
            connect_timeout_seconds: 10,