| { | |
| "source_path": "pretraining_logs_lr_001_OPTIMIZED_clean_restart/train/runs/2025-09-08_02-33-22/checkpoints/best/step-487500-val_ppl-3.72168.ckpt", | |
| "file_size_mb": 852.6802940368652, | |
| "analysis_time": "2025-11-17T23:42:54.899686", | |
| "global_step": 487500, | |
| "epoch": 0, | |
| "lightning_version": "2.5.1.post0", | |
| "step_from_filename": 487500, | |
| "learning_rate": 0.001, | |
| "model_name": "green-run-optimized-t5-base-sci-cp-en-487k-steps-lr0001-clip1", | |
| "batch_size": null, | |
| "run_info": { | |
| "run_name": "green-run-optimized", | |
| "run_type": "green-optimized", | |
| "base_model": "t5-base", | |
| "base_model_hf": "t5-base", | |
| "learning_rate": 0.001, | |
| "gradient_clip": 1.0, | |
| "scheduler": "inverse_sqrt", | |
| "warmup_steps": 20000, | |
| "config_name": "t5_continued_pretraining_lr_001_OPTIMIZED_clean_restart.yaml", | |
| "full_name_template": "green-run-optimized-t5-base-sci-cp-en-{steps}k-steps-lr0001-clip1" | |
| }, | |
| "base_model": "t5-base", | |
| "training_type": "continued_pretraining", | |
| "gradient_clip": 1.0, | |
| "scheduler": "inverse_sqrt", | |
| "warmup_steps": 20000, | |
| "config_name": "t5_continued_pretraining_lr_001_OPTIMIZED_clean_restart.yaml", | |
| "analysis_error": "could not convert string to float: '3.72168.'", | |
| "conversion_time": "2025-11-17T23:43:06.934716", | |
| "output_path": "converted_models/hf_release/en-t5-sci-continued-pretraining-487k/green-optimized-run-models/green-run-optimized-t5-base-sci-cp-en-487k-steps-lr0001-clip1", | |
| "base_model_id": "t5-base", | |
| "base_model_used": "/netscratch/nrauscher/projects/BA-hydra/converted_models/baselines/t5-base", | |
| "missing_keys": 0, | |
| "unexpected_keys": 0 | |
| } |