does-deepspeed-still-work-sft / all_results.json
lewtun's picture
lewtun HF Staff
End of training
381693b verified
{
"eval_loss": 1.116114616394043,
"eval_runtime": 0.664,
"eval_samples": 200,
"eval_samples_per_second": 301.2,
"eval_steps_per_second": 6.024,
"total_flos": 4.8695749825160806e+17,
"train_loss": 1.088731300446295,
"train_runtime": 315.8129,
"train_samples": 15806,
"train_samples_per_second": 100.097,
"train_steps_per_second": 0.785
}