open-cortex / makefile
peninsula123's picture
feat(main): stream metrics fetch
828386c
Raw
History Blame Contribute Delete
240 Bytes
# llama-server: launch the `llama-server` binary (resolved via PATH) bound to
# 127.0.0.1:8080, fetching the model Qwen/Qwen2.5-1.5B-Instruct-GGUF:Q4_K_M
# through -hf and passing --metrics.
# NOTE(review): -c is presumably the context size and -t / -tb the generation
# and batch thread counts, per llama.cpp's CLI; confirm against the installed
# version before tuning.
#
# Declared phony because this target is a command to run, not a file to build.
# Without it, a file or directory named `llama-server` in this directory would
# make `make llama-server` report "up to date" and never start the server.
.PHONY: llama-server
llama-server:
	llama-server \
	    -hf Qwen/Qwen2.5-1.5B-Instruct-GGUF:Q4_K_M \
	    -c 2048 -t 8 -tb 8 \
	    --metrics \
	    --host 127.0.0.1 --port 8080
# llama-cli: launch the `llama-cli` binary (resolved via PATH) against the
# model Qwen/Qwen2.5-1.5B-Instruct-GGUF:Q4_K_M fetched through -hf.
# NOTE(review): -c is presumably the context size, -t the thread count,
# -n the maximum number of tokens to generate and -cnv conversation mode,
# per llama.cpp's CLI; confirm against the installed version before tuning.
#
# Declared phony because this target is a command to run, not a file to build.
# Without it, a file or directory named `llama-cli` in this directory would
# make `make llama-cli` report "up to date" and never start the program.
.PHONY: llama-cli
llama-cli:
	llama-cli \
	    -hf Qwen/Qwen2.5-1.5B-Instruct-GGUF:Q4_K_M \
	    -c 2048 -t 8 \
	    -n 128 -cnv