Update Dockerfile
Browse files- Dockerfile +13 -32
Dockerfile
CHANGED
@@ -1,32 +1,13 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
11 |
-
|
12 |
-
|
13 |
-
|
14 |
-
# Clone the repository into the current directory
|
15 |
-
RUN git clone https://github.com/theroyallab/tabbyAPI .
|
16 |
-
|
17 |
-
# Install torch with CUDA support and exllamav2
|
18 |
-
RUN pip install torch --extra-index-url https://download.pytorch.org/whl/cu121
|
19 |
-
RUN pip install exllamav2
|
20 |
-
|
21 |
-
# Install any other needed packages specified in requirements.txt
|
22 |
-
RUN pip install --no-cache-dir -r requirements.txt
|
23 |
-
|
24 |
-
# Copy the current directory contents into the container at /usr/src/app
|
25 |
-
# Note: This might be redundant if you're cloning everything you need
|
26 |
-
# COPY . /usr/src/app/
|
27 |
-
|
28 |
-
# Make port 5000 available to the world outside this container
|
29 |
-
EXPOSE 5000
|
30 |
-
|
31 |
-
# Run main.py when the container launches
|
32 |
-
CMD ["python3", "main.py"]
|
|
|
1 |
+
FROM nvidia/cuda:11.8.0-devel-ubuntu22.04
|
2 |
+
# Install the OS-level build and download tools in a single layer.
# apt-get is used instead of apt because apt's CLI is not stable for scripts;
# DEBIAN_FRONTEND is set inline so package configuration cannot block the build
# on a prompt without leaking the variable into the runtime environment.
# The package lists are deleted in the same layer so they do not stay in the image.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        build-essential \
        git \
        libopenblas-dev \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*
|
3 |
+
# wget is already installed by the preceding package-install RUN step, so no
# separate layer (and second package-index refresh) is needed for it here.
|
4 |
+
# Build-time arguments (supplied with --build-arg). No default is declared, and
# none of the instructions visible in this file references them.
# NOTE(review): presumably consumed by a model-download step that is not part of
# this file — confirm, or drop them if unused.
ARG MODEL_PART_A
|
5 |
+
ARG MODEL_PART_B
|
6 |
+
ARG MODEL_NAME
|
7 |
+
ARG ADDITIONAL
|
8 |
+
RUN mkdir /opt/kobold
|
9 |
+
# Check out the latestgptq branch (with submodules) into /opt/kobold — the same
# directory that the following WORKDIR instruction switches to. The previous
# target, /opt/koboldcpp, left /opt/kobold empty, so the later steps that run
# install_requirements.sh from the working directory could not find the script.
RUN git clone https://github.com/0cc4m/KoboldAI -b latestgptq --recurse-submodules /opt/kobold
|
10 |
+
WORKDIR /opt/kobold
|
11 |
+
RUN chmod +x install_requirements.sh
|
12 |
+
RUN ./install_requirements.sh cuda
|
13 |
+
# Start the server via play.sh (resolved relative to WORKDIR). Exec form is used
# so the script is started directly instead of under `/bin/sh -c`, which lets it
# receive the stop signal sent by `docker stop`.
# NOTE(review): exec form requires play.sh to be executable and to start with a
# shebang line — confirm against the cloned repository.
CMD ["./play.sh"]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|