# LLM: one-shot llama-cli prompt that turns a natural-language request into terminal commands

# Ask a local Qwen2.5-Coder GGUF model, through llama.cpp's llama-cli, for the
# terminal command(s) that match a natural-language request. The request is the
# single-quoted text at the end of the prompt; edit it to ask something else.
#
# Flags (see `./llama-cli --help` for the authoritative list):
#   -m          path to the GGUF model file
#   -p          prompt text passed to the model
#   -ngl 99     number of layers to offload to the GPU (99 is intended to
#               cover every layer of the model)
#   -c 2048     context size in tokens
#   -no-cnv     disable conversation mode
#   -st         single turn: exit once the response is finished
#   --temp 0.0  sampling temperature 0, for repeatable output.
#               NOTE: the short flag `-t` means --threads, not temperature,
#               so `-t 0.0` would leave the temperature at its default.
./llama-cli \
  -m ~/models/qwen/Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf \
  -p "Act as a terminal assistant. When I describe an action in natural language, respond **only** with the exact terminal command(s) needed. Do **not** include explanations, warnings, or extra text. Output commands in a code block. The user described: 'using ffmpeg record screen and convert mp4 to gif using GPU for faster processing'" \
  -ngl 99 \
  -c 2048 \
  -no-cnv \
  -st \
  --temp 0.0