-Hardcoded llama tests
Some checks are pending
GBCI / build (push) Waiting to run

This commit is contained in:
Rodrigo Rodriguez (Pragmatismo) 2025-09-11 14:50:45 -03:00
parent f0cdf2047a
commit 4c002eba6a
4 changed files with 20 additions and 11 deletions

View file

@@ -17,6 +17,10 @@ apt-get update && apt-get install -y wget
wget https://dl.min.io/server/minio/release/linux-amd64/minio -O /usr/local/bin/minio wget https://dl.min.io/server/minio/release/linux-amd64/minio -O /usr/local/bin/minio
chmod +x /usr/local/bin/minio chmod +x /usr/local/bin/minio
wget https://dl.min.io/client/mc/release/linux-amd64/mc -O /usr/local/bin/mc
chmod +x /usr/local/bin/mc
useradd -r -s /bin/false minio-user || true useradd -r -s /bin/false minio-user || true
mkdir -p /var/log/minio /data mkdir -p /var/log/minio /data
chown -R minio-user:minio-user /var/log/minio /data chown -R minio-user:minio-user /var/log/minio /data

View file

@@ -36,6 +36,11 @@ rm llama-b6148-bin-ubuntu-x64.zip
wget https://huggingface.co/bartowski/DeepSeek-R1-Distill-Qwen-1.5B-GGUF/resolve/main/DeepSeek-R1-Distill-Qwen-1.5B-Q3_K_M.gguf wget https://huggingface.co/bartowski/DeepSeek-R1-Distill-Qwen-1.5B-GGUF/resolve/main/DeepSeek-R1-Distill-Qwen-1.5B-Q3_K_M.gguf
wget https://huggingface.co/CompendiumLabs/bge-small-en-v1.5-gguf/resolve/main/bge-small-en-v1.5-f32.gguf wget https://huggingface.co/CompendiumLabs/bge-small-en-v1.5-gguf/resolve/main/bge-small-en-v1.5-f32.gguf
sudo curl -fsSLo /usr/share/keyrings/brave-browser-beta-archive-keyring.gpg https://brave-browser-apt-beta.s3.brave.com/brave-browser-beta-archive-keyring.gpg
sudo curl -fsSLo /etc/apt/sources.list.d/brave-browser-beta.sources https://brave-browser-apt-beta.s3.brave.com/brave-browser.sources
sudo apt update
sudo apt install brave-browser-beta
curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh -s -- -y
source "$HOME/.cargo/env" source "$HOME/.cargo/env"

View file

@@ -1,11 +1,11 @@
CREATE TABLE system_automations ( CREATE TABLE public.system_automations (
id uuid PRIMARY KEY, id uuid NOT NULL,
kind NUMBER, kind int4 NULL,
target VARCHAR(32), target varchar(32) NULL,
schedule CHAR(6), schedule bpchar(12) NULL,
param VARCHAR(32) NOT NULL, param varchar(32) NOT NULL,
is_active BOOL NOT NULL DEFAULT TRUE, is_active bool DEFAULT true NOT NULL,
last_triggered TIMESTAMPTZ last_triggered timestamptz NULL,
CONSTRAINT system_automations_pkey PRIMARY KEY (id)
); );
CREATE INDEX idx_active_automations ON public.system_automations USING btree (kind) WHERE is_active;
CREATE INDEX idx_active_automations ON system_automations(kind) WHERE is_active;

View file

@@ -187,7 +187,7 @@ async fn start_llm_server(
let mut cmd = tokio::process::Command::new("sh"); let mut cmd = tokio::process::Command::new("sh");
cmd.arg("-c").arg(format!( cmd.arg("-c").arg(format!(
"cd {} && ./llama-server -m {} --host 0.0.0.0 --port {} --n-gpu-layers 99 &", "cd {} && ./llama-server -m {} --host 0.0.0.0 --port {} --threads 8 --threads-batch 18 --temp 0.7 --parallel 3 --repeat-penalty 1.1 --ctx-size 2096 --batch-size 2048 -n 255 --mlock --no-mmap &",
llama_cpp_path, model_path, port llama_cpp_path, model_path, port
)); ));