| { | |
| "schema_analysis": { | |
| "metrics": { | |
| "f1_score": 0.8089157550696012, | |
| "precision": 0.8324027324027324, | |
| "recall": 0.8083877833877834 | |
| }, | |
| "num_underpredictions": 210, | |
| "num_overpredictions": 112, | |
| "num_exact_schema_matches": 769, | |
| "avg_dist_gold_serialized": 0.81, | |
| "avg_dist_gold_predicted": 0.93, | |
| "num_hallucinated_schemas": 59 | |
| }, | |
| "sql_analysis": { | |
| "exec": 0.5686070686070686, | |
| "em": 0.5343035343035343, | |
| "malformed_pred_sql": 119, | |
| "correct_over_t5_large": 62, | |
| "items_with_counting_errors": 74, | |
| "edit_up": 0.1083, | |
| "edit_down": 0.7536, | |
| "progress": 0.562877905848566 | |
| } | |
| } |