Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
REM Launch llama-server.exe with the GLM-4.5-Air Q4_K_S GGUF model (first shard of 2).
REM
REM `start "" /High /B /Wait` starts the server in the High priority class, without
REM opening a new window (/B), and blocks this script until the server exits (/Wait).
REM The empty "" is the window-title argument that `start` expects before the command.
REM
REM The model path is machine-specific (G:\ drive); adjust it for your system.
REM
REM NOTE(review): the option notes below follow `llama-server --help`; confirm them
REM against the installed llama.cpp build, since flags change between releases.
REM   -c 32768               context size
REM   -t 5                   thread count
REM   -fa on                 flash attention
REM   --prio-batch 2         priority for batch-processing threads
REM   -ub 2048 -b 2048       physical / logical batch size
REM   -ctk q8_0 -ctv q8_0    K / V cache types
REM   -ngl 999               layers to offload to the GPU (999 presumably means "all")
REM   -ot "<regex>=CUDA0"    tensor buffer override: expert FFN tensors of blocks 1-5
REM   --cpu-moe              keep the MoE expert weights on the CPU
REM   --no-context-shift     disable context shifting
REM   --no-mmap              do not memory-map the model file
REM
REM NOTE(review): -ot is deliberately listed before --cpu-moe; presumably the first
REM matching override wins, so blocks 1-5 stay on CUDA0 and the remaining experts
REM go to the CPU. Verify against the server's startup log.
start "" /High /B /Wait llama-server.exe ^
-m "G:\LLM\models\GLM-4.5-Air-Q4_K_S\GLM-4.5-Air-Q4_K_S-00001-of-00002.gguf" ^
-c 32768 ^
-t 5 ^
-fa on --prio-batch 2 -ub 2048 -b 2048 ^
-ctk q8_0 -ctv q8_0 ^
-ngl 999 ^
-ot "blk\.[1-5]\.ffn_.*_exps\.=CUDA0" ^
--cpu-moe ^
--no-context-shift ^
--no-mmap
Advertisement
Add Comment
Please sign in to add a comment.