| { | |
| "entropy": 2.5530850489934287, | |
| "epoch": 2.0, | |
| "eval_entropy": 2.5582991441090903, | |
| "eval_loss": 0.4179121255874634, | |
| "eval_mean_token_accuracy": 0.9070041179656982, | |
| "eval_num_tokens": 620664491.0, | |
| "eval_runtime": 0.4825, | |
| "eval_samples": 1000, | |
| "eval_samples_per_second": 373.052, | |
| "eval_steps_per_second": 6.218, | |
| "mean_token_accuracy": 0.902903805176417, | |
| "num_tokens": 620664491.0, | |
| "total_flos": 3.623983417768542e+18, | |
| "train_loss": 0.550684680861008, | |
| "train_runtime": 5178.5318, | |
| "train_samples": 1859300, | |
| "train_samples_per_second": 118.293, | |
| "train_steps_per_second": 0.924, | |
| "weight_norm": 725.9066744423832 | |
| } |