Spaces:
Runtime error
Runtime error
gfjiogopdfgdfs
committed on
Commit
•
4b045d6
1
Parent(s):
d119bf0
Update Dockerfile
Browse files- Dockerfile +7 -8
Dockerfile
CHANGED
@@ -18,8 +18,7 @@ USER user
|
|
18 |
|
19 |
# Set environment variables
|
20 |
ENV HOME=/home/user \
|
21 |
-
PATH=/home/user/.local/bin:$PATH
|
22 |
-
PIP_USER=1
|
23 |
|
24 |
# Set the working directory
|
25 |
WORKDIR $HOME/app
|
@@ -27,11 +26,11 @@ WORKDIR $HOME/app
|
|
27 |
# Copy the current directory contents into the container at /home/user/app
|
28 |
COPY --chown=user . $HOME/app
|
29 |
|
30 |
-
#
|
31 |
-
RUN
|
32 |
|
33 |
-
#
|
34 |
-
RUN
|
35 |
|
36 |
# Install additional dependencies
|
37 |
RUN pip install huggingface-hub hf-transfer
|
@@ -45,5 +44,5 @@ RUN huggingface-cli download LoneStriker/TinyLlama-1.1B-32k-Instruct-8.0bpw-h8-e
|
|
45 |
# Expose the port the API server will listen on
|
46 |
EXPOSE 7860
|
47 |
|
48 |
-
# Command to run the API server
|
49 |
-
CMD ["/bin/bash", "-c", "/bin/python3 -m aphrodite.endpoints.openai.api_server -q exl2 --dtype auto -gmu 0.95 --kv-cache-dtype fp8_e5m2 --max-num-seqs 15 --served-model-name "BagelMIsteryTour-v2-8x7B-AWQ" --enforce-eager -tp 4 --port 7860 --host 0.0.0.0 --model ~/goliath-gptq"]
|
|
|
18 |
|
19 |
# Set environment variables
|
20 |
ENV HOME=/home/user \
|
21 |
+
PATH=/home/user/.local/bin:$PATH
|
|
|
22 |
|
23 |
# Set the working directory
|
24 |
WORKDIR $HOME/app
|
|
|
26 |
# Copy the current directory contents into the container at /home/user/app
|
27 |
COPY --chown=user . $HOME/app
|
28 |
|
29 |
+
# Install aphrodite-engine from PyPI to handle dependencies
|
30 |
+
# --no-cache-dir keeps pip's download cache out of the image layer.
RUN python3 -m pip install --no-cache-dir aphrodite-engine
|
31 |
|
32 |
+
# Clone the specific branch of aphrodite-engine for the latest features
|
33 |
+
# Shallow clone: only the tip of the branch is needed, so skip the full history to keep the layer small.
RUN git clone --depth 1 --branch feat/exllamav2-support https://github.com/PygmalionAI/aphrodite-engine.git $HOME/aphrodite-engine
|
34 |
|
35 |
# Install additional dependencies
|
36 |
RUN pip install huggingface-hub hf-transfer
|
|
|
44 |
# Expose the port the API server will listen on
|
45 |
EXPOSE 7860
|
46 |
|
47 |
+
# Command to run the API server from the cloned directory
|
48 |
+
# Inner quotes are escaped so the array stays valid JSON (exec form); with unescaped quotes Docker falls back to shell form and the command fails to start.
CMD ["/bin/bash", "-c", "cd $HOME/aphrodite-engine && /bin/python3 -m aphrodite.endpoints.openai.api_server -q exl2 --dtype auto -gmu 0.95 --kv-cache-dtype fp8_e5m2 --max-num-seqs 15 --served-model-name \"BagelMIsteryTour-v2-8x7B-AWQ\" --enforce-eager -tp 4 --port 7860 --host 0.0.0.0 --model ~/goliath-gptq"]
|