'train_runtime': 483.9556, r = 8, num_train_epochs=1, optim="adamw_torch_fused", lr_scheduler_type="cosine", metric_for_best_model="f1",
Base model