winstxnhdw committed on
Commit
1cc3f06
1 Parent(s): e01c6a6

perf/build/docs: use translator threads instead of workers

Browse files
Files changed (2) hide show
  1. Dockerfile +2 -2
  2. README.md +1 -1
Dockerfile CHANGED
@@ -1,9 +1,9 @@
1
  FROM ghcr.io/winstxnhdw/nllb-api:main
2
 
3
  ENV SERVER_PORT=7860
4
- ENV OMP_NUM_THREADS=2
5
  ENV CT2_USE_EXPERIMENTAL_PACKED_GEMM=1
6
  ENV CT2_FORCE_CPU_ISA=AVX512
7
- ENV WORKER_COUNT=1
8
 
9
  EXPOSE $SERVER_PORT
 
1
  FROM ghcr.io/winstxnhdw/nllb-api:main
2
 
3
  ENV SERVER_PORT=7860
4
+ ENV OMP_NUM_THREADS=1
5
  ENV CT2_USE_EXPERIMENTAL_PACKED_GEMM=1
6
  ENV CT2_FORCE_CPU_ISA=AVX512
7
+ ENV TRANSLATOR_THREADS=4
8
 
9
  EXPOSE $SERVER_PORT
README.md CHANGED
@@ -8,7 +8,7 @@ python_version: 3.12.3
8
  models: [winstxnhdw/nllb-200-distilled-1.3B-ct2-int8]
9
  tags: [translation, translator, nllb, ctranslate2]
10
  pinned: true
11
- base_path: /schema/swagger
12
  ---
13
 
14
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
8
  models: [winstxnhdw/nllb-200-distilled-1.3B-ct2-int8]
9
  tags: [translation, translator, nllb, ctranslate2]
10
  pinned: true
11
+ base_path: /api/schema/swagger
12
  ---
13
 
14
  Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference