{ "epoch": 2.928, "num_input_tokens_seen": 547088, "total_flos": 1.1981315796631552e+16, "train_loss": 1.5843523497222571, "train_runtime": 282.8295, "train_samples_per_second": 10.607, "train_steps_per_second": 0.329 }