"""Launcher: rebuild llama-cpp-python with CUDA flags, then start the server.

Steps, in order:
1. Uninstall any llama-cpp-python that is already present (best effort).
2. Reinstall it from source with the CMake flags in ``CMAKE_ARGS``.
3. Run ``uvicorn app:app`` on 0.0.0.0:7860 and exit with its return code.

The work only happens when this file is executed as a script; importing it
merely defines the constants and helpers below.
"""
import os
import subprocess

# CUDA toolkit location handed to CMake when compiling llama-cpp-python.
CUDA_HOME = "/usr/local/cuda-12.2"

# Value of the CMAKE_ARGS environment variable read by the package build.
# NOTE(review): newer llama.cpp releases may have renamed LLAMA_CUBLAS;
# the install below is unpinned, so confirm the flag is still honoured.
CMAKE_ARGS = " ".join(
    (
        "-DLLAMA_CUBLAS=on",
        f"-DCUDA_PATH={CUDA_HOME}",
        f"-DCUDAToolkit_ROOT={CUDA_HOME}",
        f"-DCUDAToolkit_INCLUDE_DIR={CUDA_HOME}/include",
        f"-DCUDAToolkit_LIBRARY_DIR={CUDA_HOME}/lib64",
    )
)

# Commands are argument lists so no shell is needed to run them.
UNINSTALL_COMMAND = ["pip", "uninstall", "-y", "llama-cpp-python"]
INSTALL_COMMAND = ["pip", "install", "llama-cpp-python", "--no-cache-dir"]
SERVER_COMMAND = ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]


def build_install_env(base=None):
    """Return a copy of *base* with the variables that force the CUDA build.

    Args:
        base: Mapping of environment variables to start from. Defaults to
            the current process environment (``os.environ``).

    Returns:
        A new ``dict``; *base* itself is not modified.
    """
    env = dict(os.environ if base is None else base)
    env["CMAKE_ARGS"] = CMAKE_ARGS
    env["FORCE_CMAKE"] = "1"
    return env


def main():
    """Rebuild llama-cpp-python, then run the server and return its exit code.

    Raises:
        subprocess.CalledProcessError: if the ``pip install`` step fails, so
            the server is never started against a missing or broken build.
    """
    # llama-cpp-python was removed from requirements.txt (per the original
    # note); drop any copy that is still installed so the build below
    # replaces it. Best effort: a failure here does not stop the launcher.
    subprocess.run(UNINSTALL_COMMAND, check=False)

    # Fail fast: there is no point starting the app if the build failed.
    subprocess.run(INSTALL_COMMAND, env=build_install_env(), check=True)

    # Blocks until uvicorn exits; hand its status back to the caller.
    return subprocess.run(SERVER_COMMAND, check=False).returncode


if __name__ == "__main__":
    raise SystemExit(main())