From 3b65f8536e47ddcacb6c94e7ce1ee50af63fbbe1 Mon Sep 17 00:00:00 2001 From: jimmychen Date: Sun, 29 Mar 2026 08:32:01 -0400 Subject: [PATCH] =?UTF-8?q?=E6=B7=BB=E5=8A=A0--ngl=E5=8F=82=E6=95=B0?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- llama-cpp.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/llama-cpp.md b/llama-cpp.md index 7d56b8d..4396402 100644 --- a/llama-cpp.md +++ b/llama-cpp.md @@ -1,4 +1,4 @@ -./llama-server --model /home/jimmy/NVME/model/Qwen3.5-35B-A3B-UD-IQ4_XS.gguf --alias "Qwen3.5-35B-A3B" --temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00 --host 0.0.0.0 --port 11434 --kv-unified --cache-type-k q8_0 --cache-type-v q8_0 --flash-attn on --fit on --ctx-size 262144 --jinja --no-mmap -t 24 -np 4 +./llama-server --model /home/jimmy/NVME/model/Qwen3.5-35B-A3B-UD-IQ4_XS.gguf --alias "Qwen3.5-35B-A3B" --temp 0.6 --top-p 0.95 --top-k 20 --min-p 0.00 --host 0.0.0.0 --port 11434 --kv-unified --cache-type-k q8_0 --cache-type-v q8_0 --flash-attn on --fit on --ctx-size 262144 --jinja --no-mmap -t 24 -np 4 -ngl 999 context_size 128K = 131072