eval_loss = 0.4353837760334665 f1_score = 0.6748412349722412 precision = 0.7272727272727273 recall = 0.6294612920050667