# Install the llama-cpp-python package, download a GGUF model, start
# llama-server on the IPv6 loopback address, and fetch the server's root page
# once it answers.
#
# Every step is checked so that a failed install or download does not go on to
# launch the server against a missing or partial model file. The server is
# left running in the background when this sequence finishes.

model=model.gguf
host=::1
port=8765
url="http://[${host}]:${port}/"
ready_timeout=120 # seconds to wait for the server before giving up

pip3 install llama-cpp-python || {
  printf 'error: pip3 install llama-cpp-python failed\n' >&2
  exit 1
}

# -c resumes a partial download and reuses an already-complete file instead of
# saving a second copy as model.gguf.1 that the server would never load.
wget -c "https://huggingface.co/.../model.gguf" || {
  printf 'error: download of %s failed\n' "$model" >&2
  exit 1
}

# NOTE(review): llama-server is normally built/installed from llama.cpp; it is
# unclear that the pip package installed above provides it -- confirm.
# Fail early with a clear message rather than a bare "command not found".
command -v llama-server >/dev/null 2>&1 || {
  printf 'error: llama-server not found in PATH\n' >&2
  exit 1
}

llama-server -m "$model" --host "$host" --port "$port" -c 8192 &
server_pid=$!

# A freshly backgrounded server is not listening yet, so poll instead of
# issuing a single request right after launch.
# The URL is quoted and -g (--globoff) is passed so that neither the shell nor
# curl treats the [::1] brackets as a glob pattern; -f makes HTTP error
# statuses count as failures so the loop keeps waiting.
elapsed=0
until curl -gsf "$url"; do
  # Stop waiting if the server process has already died.
  if ! kill -0 "$server_pid" 2>/dev/null; then
    printf 'error: llama-server exited before becoming ready\n' >&2
    exit 1
  fi
  if [ "$elapsed" -ge "$ready_timeout" ]; then
    printf 'error: llama-server (pid %s) not ready after %ss\n' \
      "$server_pid" "$ready_timeout" >&2
    exit 1
  fi
  sleep 1
  elapsed=$((elapsed + 1))
done