1 parent 5e90adc · commit 23e5130
docker/cuda_simple/Dockerfile
@@ -21,7 +21,7 @@ ENV LLAMA_CUBLAS=1
 RUN python3 -m pip install --upgrade pip pytest cmake scikit-build setuptools fastapi uvicorn sse-starlette pydantic-settings starlette-context
 
 # Install llama-cpp-python (build with cuda)
-RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install llama-cpp-python
+RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install -e .[server]
 
 # Run the server
 CMD python3 -m llama_cpp.server
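The change swaps "pip install llama-cpp-python" for "pip install -e .[server]", so the image builds the package (with its server extras) from the local source in the build context rather than pulling a release from PyPI, while still compiling with cuBLAS via CMAKE_ARGS. As a rough sketch of how this image might be built and run, assuming the build is done from the repository root, that the server listens on its default port 8000, and that the model path is supplied through the MODEL environment variable; the image tag, volume path, and model file name below are placeholders, not part of this commit:

# Build the CUDA image from the repository root (tag is illustrative)
docker build -t llama-cpp-python-cuda -f docker/cuda_simple/Dockerfile .

# Run with GPU access; port mapping, volume, and MODEL path are placeholders
docker run --rm --gpus all -p 8000:8000 \
  -v /path/to/models:/models \
  -e MODEL=/models/model.gguf \
  llama-cpp-python-cuda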