| { | |
| "epoch": 4.0, | |
| "eval_loss": 0.5301879048347473, | |
| "eval_runtime": 0.5773, | |
| "eval_samples": 99, | |
| "eval_samples_per_second": 133.388, | |
| "eval_steps_per_second": 3.465, | |
| "perplexity": 1.699251576208271, | |
| "total_flos": 340525408321536.0, | |
| "train_loss": 0.3252074327502578, | |
| "train_runtime": 5343.4474, | |
| "train_samples": 73061, | |
| "train_samples_per_second": 41.505, | |
| "train_steps_per_second": 1.297 | |
| } |