TwT-6's picture
Upload 2667 files
256a159 verified
raw
history blame
662 Bytes
from opencompass.models import HuggingFaceCausalLM
# OpenCompass model list with a single entry: the DeepSeek LLM 67B base
# checkpoint, wrapped by HuggingFaceCausalLM.
models = [
    {
        'type': HuggingFaceCausalLM,
        'abbr': 'deepseek-67b-base-hf',
        # The model and its tokenizer are resolved from the same identifier.
        'path': 'deepseek-ai/deepseek-llm-67b-base',
        'tokenizer_path': 'deepseek-ai/deepseek-llm-67b-base',
        # Keyword arguments handed to the model side of the wrapper.
        'model_kwargs': {
            'device_map': 'auto',
            'trust_remote_code': True,
        },
        # Keyword arguments handed to the tokenizer side of the wrapper;
        # both padding and truncation are configured for the left side.
        'tokenizer_kwargs': {
            'padding_side': 'left',
            'truncation_side': 'left',
            'trust_remote_code': True,
            'use_fast': False,
        },
        # Length and batching limits for this entry.
        'max_out_len': 100,
        'max_seq_len': 2048,
        'batch_size': 8,
        # NOTE(review): presumably the resources requested per evaluation
        # task (4 GPUs, 1 process) -- confirm against the runner in use.
        'run_cfg': {'num_gpus': 4, 'num_procs': 1},
    },
]