Azam

Files changed (6) hide show

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3175558e8e61233286d0233755e426ebc33a4a0ee9d88efeabc91b0969dd0d6c
 size 2498522505

 version https://git-lfs.github.com/spec/v1
+oid sha256:2251f8fb6941a79db7b7c8f419235cd1d3a8ab37174d57517d90234d4e41a471
 size 2498522505

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b83378c33a6ea5b49584394b6889d866dda8704d4223b7e012cbbcb8bc2469dc
 size 1266130541

 version https://git-lfs.github.com/spec/v1
+oid sha256:93536e6e0a8eb02eb18680c9457964a62569508e9def6f8c9dc2c61aac2fa178
 size 1266130541

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2d6c598ad1ff03fdbae199c042313f72c379e59a7adc5c986920487ec0ef0f0
 size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:59d3437cc781f60db7f0c4ec11b98c7820ced9da2ab517212a97208c81e0a031
 size 14503

scaler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a4b9accfbdcb85276435ad005655da973cd6905daf1d6df04732beae9fcc5608
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:8139a2d5a513b92ca7751a538153ea76a749e3742836b6044f8c530ae1149fb6
 size 559

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0408533f367f94f43315c4942763b084245dd96c78cefc95eb3b423200fa39bb
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:748aacfdb5198e403336e1866da3fd45d311cf7ebe83e327e4ae797f20a0f0f0
 size 623

trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.5694444444444446,
-  "global_step": 740,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -1101,26 +1101,11 @@
       "eval_samples_per_second": 6.423,
       "eval_steps_per_second": 1.606,
       "step": 730
-    },
-    {
-      "epoch": 2.57,
-      "learning_rate": 1.4467592592592593e-05,
-      "loss": 0.3625,
-      "step": 740
-    },
-    {
-      "epoch": 2.57,
-      "eval_accuracy": 0.8003472089767456,
-      "eval_loss": 0.5525452494621277,
-      "eval_runtime": 90.5733,
-      "eval_samples_per_second": 6.359,
-      "eval_steps_per_second": 1.59,
-      "step": 740
     }
   ],
   "max_steps": 864,
   "num_train_epochs": 3,
-  "total_flos": 2.187634079192584e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.5347222222222223,
+  "global_step": 730,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 6.423,
       "eval_steps_per_second": 1.606,
       "step": 730
     }
   ],
   "max_steps": 864,
   "num_train_epochs": 3,
+  "total_flos": 2.1573660231214095e+18,
   "trial_name": null,
   "trial_params": null
 }