# Hyperparameters and run settings for the experiment, gathered in one dict.
# NOTE(review): several keys (accelerator, max_epochs, accumulate_grad_batches,
# precision, gradient_clip_val) look like trainer keyword arguments -- confirm
# against the code that consumes CONFIG.
CONFIG = dict(
    # Model
    model_name="microsoft/deberta-v3-large",
    num_classes=6,
    num_frozen_layers=20,  # out of 24 in deberta
    # Optimisation
    lr=2e-5,
    weight_decay=0.01,
    # Data loading / tokenisation
    batch_size=8,
    num_workers=8,
    max_length=512,
    # Training loop
    accelerator='gpu',
    max_epochs=5,
    # NOTE(review): if batch_size is per step, 4 accumulated batches would
    # presumably give an effective batch of 32 -- confirm.
    accumulate_grad_batches=4,
    precision=16,
    # NOTE(review): a clip value this large presumably rarely triggers --
    # confirm it is intentional.
    gradient_clip_val=1000,
    # Data splitting
    train_size=0.8,
    num_cross_val_splits=5,
)
# We can also try nn.SmoothL1Loss.