#!/usr/bin/env bash
#
# Launch llama-server (Vulkan build) with a Qwen3.6-35B-A3B IQ3_M GGUF model,
# using sampling and speculative-decoding settings optimized for coding.
#
# Optional environment overrides (defaults match the original hard-coded paths):
#   LLAMA_BIN_DIR     directory holding llama-server and its shared libraries
#   LLAMA_MODEL_PATH  GGUF model file to load

# 1. Set Environment Variables
llama_bin_dir="${LLAMA_BIN_DIR:-/home/eaman/llama/bin_vulkan}"
model_path="${LLAMA_MODEL_PATH:-/home/eaman/lm/models/mradermacher/Qwen3.6-35B-A3B.i1-IQ3_M.gguf}"

# Search the bundled libraries first, but keep any loader paths the caller
# already exported instead of discarding them.
export LD_LIBRARY_PATH="${llama_bin_dir}${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"

# 2. Run the Server
# Flag groups, in order: model and listen address, slot count, KV-cache types,
# flash attention, sampling, batch size, context/memory sizing, chat template,
# n-gram speculative decoding, then cache/offload/logging options.
# See `llama-server --help` for the exact meaning of each flag in this build.
# NOTE(review): --host 0.0.0.0 listens on every network interface; confirm the
# machine is not exposed to an untrusted network.
# The last argument deliberately has no trailing backslash, so lines added
# below this command are never absorbed into it.
"${llama_bin_dir}/llama-server" \
  -m "${model_path}" \
  --host 0.0.0.0 \
  -np 1 \
  -ctk q4_0 \
  -ctv q4_0 \
  -fa on \
  --temp 0.7 \
  --top-k 30 \
  --top-p 0.95 \
  --min-p 0.0 \
  --repeat-penalty 1.0 \
  -b 512 \
  --fit-target 40 \
  --ctx-size 121000 \
  --jinja \
  --no-mmap \
  --spec-type ngram-mod \
  --spec-ngram-mod-n-match 8 \
  --spec-ngram-mod-n-min 3 \
  --spec-ngram-mod-n-max 24 \
  --cache-ram 6000 \
  -ngl 99 \
  -lv 3 \
  --no-warmup
