# Ignore patterns, one per line. Several space-separated patterns on the same
# line are read as a single pattern containing literal spaces, which matches
# nothing, so every entry below gets its own line.
# NOTE(review): comments assume gitignore pattern semantics — confirm this
# file is consumed by git (or a tool using the same rules).

# Directories anchored to the location of this file (leading "/");
# the trailing "/" restricts each match to directories.
/cuda*/
/python/
/venv/

# No slash in the pattern: matched by name at any depth.
__pycache__
model.json
token.txt
*.gguf