VideoLLaMA2-AV / requirements.txt
youngsheen's picture
add requirements.txt
e818756
raw
history blame
627 Bytes
# pip requirements file.
# Entries written with `==` are pinned to one exact version. `pydantic>=2.0` is
# only a lower bound. Entries with no version specifier (pysubs2, librosa,
# pytorchvideo, shortuuid, markdown2[all], requests, uvicorn, fastapi,
# tensorboard, wandb, tabulate) resolve to whatever pip selects at install
# time, so two installs made at different dates may differ for those packages.
#
# basic dependencies
# NOTE(review): torch / torchaudio / torchvision releases are built against each
# other; if one of these three pins is changed, confirm the other two still
# match it.
torch==2.2.0
torchaudio==2.2.0
torchvision==0.17.0
# NOTE(review): presumably tokenizers is pinned to a version accepted by this
# transformers release — re-check the pair together when bumping either one.
transformers==4.42.3
tokenizers==0.19.1
deepspeed==0.13.1
accelerate==0.26.1
peft==0.4.0
timm==1.0.3
numpy==1.24.4
# data processing
decord==0.6.0
imageio==2.34.0
imageio-ffmpeg==0.4.9
moviepy==1.0.3
scenedetect==0.6.3
opencv-python==4.6.0.66
# The next three entries are unpinned.
# NOTE(review): the PyPI release of pytorchvideo is reported to import
# torchvision.transforms.functional_tensor, which torchvision 0.17 may no longer
# provide — confirm the pytorchvideo modules used by this project import cleanly
# against the torchvision pin above.
pysubs2
librosa
pytorchvideo
# misc
scikit-learn==1.2.2
huggingface_hub==0.23.4
sentencepiece==0.1.99
shortuuid
einops==0.6.1
einops-exts==0.0.4
bitsandbytes==0.43.0
pydantic>=2.0
# `[all]` requests markdown2's optional "all" extra in addition to the base package.
markdown2[all]
# NOTE(review): gradio_client and httpx are presumably pinned to versions that
# this gradio release accepts — verify against gradio's own requirements before
# changing any of the three.
gradio==3.50.0
gradio_client==0.6.1
httpx==0.24.1
openai==1.33.0
# Everything below is unpinned.
# NOTE(review): fastapi and uvicorn are also used by the pinned gradio above
# (TODO confirm); an unpinned upgrade of either could change behaviour under
# that older gradio release.
requests
uvicorn
fastapi
tensorboard
wandb
tabulate