# LLM
# One-shot llama-cli run: ask a local Qwen2.5-Coder GGUF model to turn a
# natural-language request into the matching terminal command(s).
#
# Flags (per llama.cpp's llama-cli options; confirm with `./llama-cli --help`
# for the build in use):
#   -m          path to the GGUF model file
#   -p          prompt text
#   -ngl 99     number of model layers to offload to the GPU
#   -c 2048     context size in tokens
#   -no-cnv     disable conversation mode
#   -st         single turn
#   --temp 0.0  sampling temperature; 0.0 for repeatable output
#
# The temperature must be given as --temp: `-t` is the --threads option, so
# `-t 0.0` would leave the sampling temperature at its default.
./llama-cli \
  -m ~/models/qwen/Qwen2.5-Coder-7B-Instruct-Q4_K_M.gguf \
  -p "Act as a terminal assistant. When I describe an action in natural language, respond **only** with the exact terminal command(s) needed. Do **not** include explanations, warnings, or extra text. Output commands in a code block. The user described: 'using ffmpeg record screen and convert mp4 to gif using GPU for faster processing'" \
  -ngl 99 \
  -c 2048 \
  -no-cnv \
  -st \
  --temp 0.0