Spaces:
Runtime error
Runtime error
# Startup script: prepares a Python environment, unpacks the llama.cpp
# binaries, downloads a GGUF model, launches llama-server in the background
# and finally runs app.py in the foreground.

# Print an error message to stderr and abort the script with status 1.
die() {
  printf 'error: %s\n' "$*" >&2
  exit 1
}

# Set the working directory.
export WORK="/home/user/app"
cd "$WORK" || die "cannot cd to $WORK"

# Create a Python virtual environment (optional). This step is best-effort:
# if the venv cannot be created the script carries on with whatever Python
# environment is already active.
if python3 -m venv venv && [ -f venv/bin/activate ]; then
  # '.' is the portable spelling of 'source'; the file has no shebang, so it
  # may be run by a POSIX sh where 'source' does not exist.
  . venv/bin/activate
else
  printf 'warning: %s\n' "could not create venv; using current Python environment" >&2
fi

# Install Python packages.
pip install --upgrade pip
# Fail early: without these packages app.py cannot start, and there is no
# point downloading a multi-gigabyte model first.
pip install gradio openai aiohttp || die "pip install of required packages failed"

echo "Unzip and download model..."
# -o overwrites existing files without prompting; the output is discarded, so
# an interactive overwrite prompt on a re-run would otherwise be invisible.
unzip_status=0
unzip -o llama_cpp_avx512.zip > /dev/null 2>&1 || unzip_status=$?
# Info-ZIP unzip uses status 1 for "warnings, but processing completed";
# anything above that is a real failure.
if [ "$unzip_status" -gt 1 ]; then
  die "unzip of llama_cpp_avx512.zip failed (status $unzip_status)"
fi

# Alternative model (disabled):
#wget -O model.gguf https://huggingface.co/Intel/gpt-oss-20b-gguf-q4ks-AutoRound/resolve/main/gpt-oss-20b-32x2.4B-Q4_K_S.gguf > /dev/null 2>&1
if ! wget -O model.gguf https://huggingface.co/unsloth/gpt-oss-20b-GGUF/resolve/main/gpt-oss-20b-Q4_K_M.gguf > /dev/null 2>&1; then
  # Do not leave a truncated model behind for the server to choke on.
  rm -f model.gguf
  die "model download failed"
fi

echo "Start llama.cpp server..."
# The server runs in the background with all of its output captured in
# llama.log, so that app.py can be started right after it.
# NOTE(review): --ctx-size 131027 looks like a transposition of 131072 (2^17);
# left unchanged here -- confirm the intended value.
nohup ./llama-server \
  -m model.gguf \
  --port 8000 \
  --host 0.0.0.0 \
  --threads 2 \
  --ctx-size 131027 \
  --mlock \
  --jinja \
  --temp 0.2 \
  --top-p 0.85 \
  -v \
  > llama.log 2>&1 &

# Follow the log continuously without blocking python app.py (disabled).
#tail -n 50 -f llama.log &
#sleep 200

echo "Start app.py..."
python app.py