gfjiogopdfgdfs committed on
Commit
3a5ba54
1 Parent(s): cd48a0e

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +1 -1
Dockerfile CHANGED
@@ -24,4 +24,4 @@ ENV HF_HUB_ENABLE_HF_TRANSFER=1
24
  RUN huggingface-cli download brucethemoose/Yi-34B-200K-RPMerge --local-dir $HOME/goliath-gptq --local-dir-use-symlinks False --cache-dir $HOME/cache
25
  EXPOSE 7860
26
  # Should expose on all network interfaces so 0.0.0.0 not only localhost
27
- CMD /bin/bash -c '/bin/python3 -m aphrodite.endpoints.openai.api_server --dtype auto --max-parallel-loading-workers 4 -gmu 0.95 --kv-cache-dtype fp8 --max-num-seqs 15 --served-model-name "brucethemoose/Yi-34B-200K-RPMerge" --enforce-eager --port 7860 --host 0.0.0.0 --model ~/goliath-gptq'
 
24
  RUN huggingface-cli download brucethemoose/Yi-34B-200K-RPMerge --local-dir $HOME/goliath-gptq --local-dir-use-symlinks False --cache-dir $HOME/cache
25
  EXPOSE 7860
26
  # Should expose on all network interfaces so 0.0.0.0 not only localhost
27
+ CMD /bin/bash -c '/bin/python3 -m aphrodite.endpoints.openai.api_server --dtype auto --max-parallel-loading-workers 4 -gmu 0.95 --kv-cache-dtype fp8_e5m2 --max-num-seqs 15 --served-model-name "brucethemoose/Yi-34B-200K-RPMerge" --enforce-eager --port 7860 --host 0.0.0.0 --model ~/goliath-gptq'