From 694fb91efefe11b2d0f639a1679e7678f56508c2 Mon Sep 17 00:00:00 2001
From: "Rodrigo Rodriguez (Pragmatismo)"
Date: Sun, 12 Apr 2026 09:59:49 -0300
Subject: [PATCH] Add comment about batch_size reduction for llama-server stability

---
 src/core/kb/embedding_generator.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/core/kb/embedding_generator.rs b/src/core/kb/embedding_generator.rs
index 2c149a90..0249b2c9 100644
--- a/src/core/kb/embedding_generator.rs
+++ b/src/core/kb/embedding_generator.rs
@@ -43,7 +43,7 @@ impl Default for EmbeddingConfig {
             embedding_model: "BAAI/bge-multilingual-gemma2".to_string(),
             embedding_key: None,
             dimensions: 2048,
-            batch_size: 2,
+            batch_size: 2, // Reduced from 16 to prevent llama-server crash
             timeout_seconds: 60,
             max_concurrent_requests: 1,
             connect_timeout_seconds: 10,