mono/packages/kbot/cpp/scripts/run-7b.sh
2026-03-30 12:07:13 +02:00

10 lines
207 B
Bash

# Start llama-server.exe serving the Qwen2.5-7B-Instruct Q4_K_M GGUF model.
# Each setting lives in a plain (non-exported) shell variable so it can carry
# its own note; the argument list handed to the server is unchanged.
# Flag meanings below follow llama-server's --help output.

# Model location: Hugging Face repository and the GGUF file inside it.
hf_repo='paultimothymooney/Qwen2.5-7B-Instruct-Q4_K_M-GGUF'
hf_file='qwen2.5-7b-instruct-q4_k_m.gguf'

# Runtime sizing.
threads=16       # -t: number of threads
ctx_size=2048    # -c: context size
batch_size=512   # -b: batch size

# Sampling settings passed on the command line.
temperature=0.2  # --temp
top_p=0.9        # --top-p

# Port passed to the server via --port.
port=8888

# Kept as the final command so the script's exit status is the server's.
llama-server.exe \
  --hf-repo "$hf_repo" \
  --hf-file "$hf_file" \
  -t "$threads" \
  -c "$ctx_size" \
  -b "$batch_size" \
  --temp "$temperature" \
  --top-p "$top_p" \
  --port "$port"