PMBeta / start.py
Sergidev's picture
Update start.py
f590568 verified
raw
history blame
583 Bytes
import os
import subprocess
import sys
# commented because the existing llama-cpp-python package was removed from requirements.txt
# Launcher: rebuild llama-cpp-python with CUDA (cuBLAS) flags, then start the
# uvicorn server for ``app:app`` on port 7860.

# Best-effort removal of any already-installed llama-cpp-python so the build
# below replaces it. The exit status is deliberately not checked.
subprocess.run(["pip", "uninstall", "-y", "llama-cpp-python"])

# CMake flags pointing the build at the CUDA 12.2 toolkit.
# NOTE(review): newer llama-cpp-python releases document -DGGML_CUDA=on in
# place of -DLLAMA_CUBLAS=on, and the package version is not pinned here --
# confirm this flag is still honoured by the version that gets installed.
cuda_root = "/usr/local/cuda-12.2"
cmake_args = " ".join(
    [
        "-DLLAMA_CUBLAS=on",
        f"-DCUDA_PATH={cuda_root}",
        f"-DCUDAToolkit_ROOT={cuda_root}",
        f"-DCUDAToolkit_INCLUDE_DIR={cuda_root}/include",
        f"-DCUDAToolkit_LIBRARY_DIR={cuda_root}/lib64",
    ]
)

# Pass the build settings through the child's environment instead of relying
# on shell ``VAR=value command`` prefix syntax.
build_env = {**os.environ, "CMAKE_ARGS": cmake_args, "FORCE_CMAKE": "1"}
install_command = ["pip", "install", "llama-cpp-python", "--no-cache-dir"]

# check=True: stop here with a clear error if the build/install fails, rather
# than starting the server without the package this step is meant to provide.
subprocess.run(install_command, env=build_env, check=True)

# Run the server in the foreground and propagate its exit status so that a
# supervisor (container runtime, etc.) can see when it failed.
server = subprocess.run(
    ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
)
sys.exit(server.returncode)