From bd9f0febb18b4e42fa51b86e8c9037021c9681bc Mon Sep 17 00:00:00 2001
From: "Sebastian.W"
Date: Mon, 19 Feb 2024 16:32:56 +0800
Subject: [PATCH 1/3] Update build-docker.yaml

---
 .github/workflows/build-docker.yaml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/build-docker.yaml b/.github/workflows/build-docker.yaml
index 750b91e1f..014a377f7 100644
--- a/.github/workflows/build-docker.yaml
+++ b/.github/workflows/build-docker.yaml
@@ -39,8 +39,8 @@ jobs:
           pull: true
           platforms: linux/amd64,linux/arm64
           tags: |
-            ghcr.io/abetlen/llama-cpp-python:latest
-            ghcr.io/abetlen/llama-cpp-python:${{ github.ref_name }}
+            ghcr.io/thiner/llama-cpp-python:latest
+            ghcr.io/thiner/llama-cpp-python:${{ github.ref_name }}
           build-args: |
             BUILDKIT_INLINE_CACHE=1
 

From 5e90adc83bde29c098474473f493cc235892e05d Mon Sep 17 00:00:00 2001
From: "Sebastian.W"
Date: Mon, 19 Feb 2024 17:51:06 +0800
Subject: [PATCH 2/3] Update build-docker.yaml

---
 .github/workflows/build-docker.yaml | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/build-docker.yaml b/.github/workflows/build-docker.yaml
index 014a377f7..e190b2b20 100644
--- a/.github/workflows/build-docker.yaml
+++ b/.github/workflows/build-docker.yaml
@@ -34,13 +34,13 @@ jobs:
         uses: docker/build-push-action@v4
         with:
           context: .
-          file: "docker/simple/Dockerfile"
+          file: "docker/cuda_simple/Dockerfile"
           push: ${{ startsWith(github.ref, 'refs/tags/') }}
           pull: true
           platforms: linux/amd64,linux/arm64
           tags: |
-            ghcr.io/thiner/llama-cpp-python:latest
-            ghcr.io/thiner/llama-cpp-python:${{ github.ref_name }}
+            ghcr.io/thiner/llama-cpp-python:latest-cuda
+            ghcr.io/thiner/llama-cpp-python:${{ github.ref_name }}-cuda
           build-args: |
             BUILDKIT_INLINE_CACHE=1
 

From 23e5130582bfad0026f63644d0135f21977d3276 Mon Sep 17 00:00:00 2001
From: "Sebastian.W"
Date: Mon, 19 Feb 2024 17:53:56 +0800
Subject: [PATCH 3/3] Update Dockerfile

Install from source
---
 docker/cuda_simple/Dockerfile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docker/cuda_simple/Dockerfile b/docker/cuda_simple/Dockerfile
index a9e51cdc1..8e0f2f9b0 100644
--- a/docker/cuda_simple/Dockerfile
+++ b/docker/cuda_simple/Dockerfile
@@ -21,7 +21,7 @@ ENV LLAMA_CUBLAS=1
 RUN python3 -m pip install --upgrade pip pytest cmake scikit-build setuptools fastapi uvicorn sse-starlette pydantic-settings starlette-context
 
 # Install llama-cpp-python (build with cuda)
-RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install llama-cpp-python
+RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install -e .[server]
 
 # Run the server
 CMD python3 -m llama_cpp.server