from transformers import AutoModel

# Load the pretrained checkpoint identified by "nvidia/Llama3-ChatQA-1.5-8B"
# and bind the resulting model object to the module-level name `model`.
# NOTE(review): `AutoModel` presumably resolves to the bare backbone without
# a language-modeling head; if text generation is the goal,
# `AutoModelForCausalLM` may be the intended class — confirm against usage.
# NOTE(review): this runs at import time and presumably fetches the weights
# on first use if they are not cached locally — verify this is acceptable
# for importers of this module.
model = AutoModel.from_pretrained("nvidia/Llama3-ChatQA-1.5-8B")