# Image that layers runtime configuration on top of the prebuilt llm-api image.
# NOTE(review): `main` is a moving tag; pin a version tag or digest if
# reproducible builds are required.
FROM ghcr.io/winstxnhdw/llm-api:main

# Port number reused by EXPOSE below; presumably also read by the server in
# the base image to choose its listening port - confirm against the base image.
ENV SERVER_PORT=7860

# CPU runtime tuning.
# OMP_NUM_THREADS caps the OpenMP thread pool at 2 threads.
# NOTE(review): the CT2_* variables look like CTranslate2 settings (packed GEMM
# and forced AVX512 dispatch) - confirm the deployment hosts support AVX512.
ENV OMP_NUM_THREADS=2 \
    CT2_USE_EXPERIMENTAL_PACKED_GEMM=1 \
    CT2_FORCE_CPU_ISA=AVX512

# Documentation only: records the port contract, does not publish the port.
EXPOSE $SERVER_PORT