gfjiogopdfgdfs committed on
Commit
4b045d6
1 Parent(s): d119bf0

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -8
Dockerfile CHANGED
@@ -18,8 +18,7 @@ USER user
18
 
19
  # Set environment variables
20
  ENV HOME=/home/user \
21
- PATH=/home/user/.local/bin:$PATH \
22
- PIP_USER=1
23
 
24
  # Set the working directory
25
  WORKDIR $HOME/app
@@ -27,11 +26,11 @@ WORKDIR $HOME/app
27
  # Copy the current directory contents into the container at /home/user/app
28
  COPY --chown=user . $HOME/app
29
 
30
- # Clone the aphrodite-engine from the specific branch
31
- RUN git clone --branch feat/exllamav2-support https://github.com/PygmalionAI/aphrodite-engine.git $HOME/aphrodite-engine
32
 
33
- # Install dependencies from the cloned repository
34
- RUN cd $HOME/aphrodite-engine && pip install -e .
35
 
36
  # Install additional dependencies
37
  RUN pip install huggingface-hub hf-transfer
@@ -45,5 +44,5 @@ RUN huggingface-cli download LoneStriker/TinyLlama-1.1B-32k-Instruct-8.0bpw-h8-e
45
  # Expose the port the API server will listen on
46
  EXPOSE 7860
47
 
48
- # Command to run the API server
49
- CMD ["/bin/bash", "-c", "/bin/python3 -m aphrodite.endpoints.openai.api_server -q exl2 --dtype auto -gmu 0.95 --kv-cache-dtype fp8_e5m2 --max-num-seqs 15 --served-model-name "BagelMIsteryTour-v2-8x7B-AWQ" --enforce-eager -tp 4 --port 7860 --host 0.0.0.0 --model ~/goliath-gptq"]
 
18
 
19
  # Set environment variables
20
  ENV HOME=/home/user \
21
+ PATH=/home/user/.local/bin:$PATH
 
22
 
23
  # Set the working directory
24
  WORKDIR $HOME/app
 
26
  # Copy the current directory contents into the container at /home/user/app
27
  COPY --chown=user . $HOME/app
28
 
29
+ # Install aphrodite-engine from PyPI to handle dependencies
30
+ RUN python3 -m pip install aphrodite-engine
31
 
32
+ # Clone the specific branch of aphrodite-engine for the latest features
33
+ RUN git clone --branch feat/exllamav2-support https://github.com/PygmalionAI/aphrodite-engine.git $HOME/aphrodite-engine
34
 
35
  # Install additional dependencies
36
  RUN pip install huggingface-hub hf-transfer
 
44
  # Expose the port the API server will listen on
45
  EXPOSE 7860
46
 
47
+ # Command to run the API server from the cloned directory
48
+ CMD ["/bin/bash", "-c", "cd $HOME/aphrodite-engine && /bin/python3 -m aphrodite.endpoints.openai.api_server -q exl2 --dtype auto -gmu 0.95 --kv-cache-dtype fp8_e5m2 --max-num-seqs 15 --served-model-name "BagelMIsteryTour-v2-8x7B-AWQ" --enforce-eager -tp 4 --port 7860 --host 0.0.0.0 --model ~/goliath-gptq"]