# Start Triton Inference Server, serving the models found in
# ./model_repo_sense_voice_small (path is relative to the current directory).

# Restrict the CUDA devices visible to the server process to device 0.
export CUDA_VISIBLE_DEVICES=0

# NOTE: `export` and `tritonserver` must be separate commands. When they share
# a line, the server invocation is parsed as extra arguments to `export`
# (bash reports "not a valid identifier") and the server is never started.
#
# Memory pool sizes are given in bytes:
#   --pinned-memory-pool-byte-size  2048000000
#   --cuda-memory-pool-byte-size    0:4096000000  (format <gpu id>:<bytes>)
tritonserver \
  --model-repository=./model_repo_sense_voice_small \
  --pinned-memory-pool-byte-size=2048000000 \
  --cuda-memory-pool-byte-size=0:4096000000