SystemAdmin123 commited on
Commit
0294c91
·
verified ·
1 Parent(s): ac0505f

Training in progress, step 20, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c914af7e4717984588deb34667879d37816d8425bf9f40c7f2df62411adc325a
3
  size 4140280
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ffbf8790409dcc7f8ae4e5a4966c936a38f8b35fdd2d824e7615da66bc2eed9
3
  size 4140280
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f1d4cc7e69b6d4ecabbbf7997c661f2f6b544b7bb70ab8878c1272f23010f6f
3
  size 4291766
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40cdddd868b8628780578eafdc62f083f38c7191db137d46765fb42910c21aa2
3
  size 4291766
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4651e32e118f1ea1a8e26dfbbe64298593e12e6a71bcd36cb77f04f86d3f86d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02bd6697dd0ac01f79967d93e880e93c5ad7e5d6a672668dd596f9f42c435066
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0c1eba909fbb51daca773a25c075f182b4096aff21c9b4ff19dbada2080ac99
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1946c0d35865c02655624537450071d8e3a581f1d24f3c539357cae293b3d2d2
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:28adb9f06e220aefdc723ea4380a84d42b8bfb87cc53ce65859d55ce1876f51c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9faf933c304288a566e09316737d2bdccb42e76da4138d98110982bcbf5dbf1
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:423c49ed521f6986d20d8b29112b383f4b0f3f2e228084ef82c2ad7dcd5d1de8
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f2cb6de5c0f2b78c1515e90a9ab03144587d336dd27fc87023f09785c5d64cb
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a60c7d771c1fd156acee762fba03c724cb41829a3f71df370ecd1d20b134982
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84f22729b765b6841bd185712dd3ab8bf338866cd8396b5dce62f9950913691a
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 16.666666666666668,
5
- "eval_steps": 200,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,9 +11,9 @@
11
  {
12
  "epoch": 0.16666666666666666,
13
  "eval_loss": 10.377338409423828,
14
- "eval_runtime": 2.3495,
15
- "eval_samples_per_second": 638.849,
16
- "eval_steps_per_second": 5.107,
17
  "step": 1
18
  },
19
  {
@@ -31,67 +31,19 @@
31
  "step": 20
32
  },
33
  {
34
- "epoch": 5.0,
35
- "grad_norm": 0.45703125,
36
- "learning_rate": 0.00016772815716257412,
37
- "loss": 10.2229,
38
- "step": 30
39
- },
40
- {
41
- "epoch": 6.666666666666667,
42
- "grad_norm": 0.458984375,
43
- "learning_rate": 0.00014016954246529696,
44
- "loss": 10.1217,
45
- "step": 40
46
- },
47
- {
48
- "epoch": 8.333333333333334,
49
- "grad_norm": 0.4609375,
50
- "learning_rate": 0.00010825793454723325,
51
- "loss": 10.0382,
52
- "step": 50
53
- },
54
- {
55
- "epoch": 10.0,
56
- "grad_norm": 0.4609375,
57
- "learning_rate": 7.54514512859201e-05,
58
- "loss": 9.9768,
59
- "step": 60
60
- },
61
- {
62
- "epoch": 11.666666666666666,
63
- "grad_norm": 0.4609375,
64
- "learning_rate": 4.530518418775733e-05,
65
- "loss": 9.9373,
66
- "step": 70
67
- },
68
- {
69
- "epoch": 13.333333333333334,
70
- "grad_norm": 0.462890625,
71
- "learning_rate": 2.1085949060360654e-05,
72
- "loss": 9.9182,
73
- "step": 80
74
- },
75
- {
76
- "epoch": 15.0,
77
- "grad_norm": 0.46484375,
78
- "learning_rate": 5.418275829936537e-06,
79
- "loss": 9.9122,
80
- "step": 90
81
- },
82
- {
83
- "epoch": 16.666666666666668,
84
- "grad_norm": 0.462890625,
85
- "learning_rate": 0.0,
86
- "loss": 9.9115,
87
- "step": 100
88
  }
89
  ],
90
  "logging_steps": 10,
91
  "max_steps": 100,
92
  "num_input_tokens_seen": 0,
93
  "num_train_epochs": 17,
94
- "save_steps": 200,
95
  "stateful_callbacks": {
96
  "TrainerControl": {
97
  "args": {
@@ -99,12 +51,12 @@
99
  "should_evaluate": false,
100
  "should_log": false,
101
  "should_save": true,
102
- "should_training_stop": true
103
  },
104
  "attributes": {}
105
  }
106
  },
107
- "total_flos": 164363029708800.0,
108
  "train_batch_size": 32,
109
  "trial_name": null,
110
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.3333333333333335,
5
+ "eval_steps": 20,
6
+ "global_step": 20,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 0.16666666666666666,
13
  "eval_loss": 10.377338409423828,
14
+ "eval_runtime": 2.3538,
15
+ "eval_samples_per_second": 637.683,
16
+ "eval_steps_per_second": 5.098,
17
  "step": 1
18
  },
19
  {
 
31
  "step": 20
32
  },
33
  {
34
+ "epoch": 3.3333333333333335,
35
+ "eval_loss": 10.274003028869629,
36
+ "eval_runtime": 2.365,
37
+ "eval_samples_per_second": 634.681,
38
+ "eval_steps_per_second": 5.074,
39
+ "step": 20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
40
  }
41
  ],
42
  "logging_steps": 10,
43
  "max_steps": 100,
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 17,
46
+ "save_steps": 20,
47
  "stateful_callbacks": {
48
  "TrainerControl": {
49
  "args": {
 
51
  "should_evaluate": false,
52
  "should_log": false,
53
  "should_save": true,
54
+ "should_training_stop": false
55
  },
56
  "attributes": {}
57
  }
58
  },
59
+ "total_flos": 32872605941760.0,
60
  "train_batch_size": 32,
61
  "trial_name": null,
62
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:767cbb0126f5e19779e9fcc2851f3166d36ca132f2aa13429b17ffa28b07b942
3
  size 6904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa3a4fef869eec54885a3e827a7faceb53e864a7600488a249371d1dec63ce95
3
  size 6904