Training in progress, step 300
Browse files
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4986211280
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12c9a3aac0fe1a3b7ae85bf60328212e49ef81b52ec54043b4188d1fc35f6e9f
|
3 |
size 4986211280
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847344
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a6b75ecc32886f9fb5a82ad02512a1377aa626688027eb5c9932502892e4a3c
|
3 |
size 4954847344
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6435465b368f32be72d340e1f8993295954b628fc18b831a27176c7ab25b6ef9
|
3 |
size 4954847392
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bf1c92a32870ba09b95ef4d61585d5a6448ff9fcb2cbdae668d737307835979
|
3 |
size 4954847392
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4954847392
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22f24dc7132d1a9ac06a252c92133877e9a27d9d251e455fb55ff4648f9a2610
|
3 |
size 4954847392
|
model-00006-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4734533160
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b90254a42bc66c2e8224de869cd641f758184d02f86a9f06c64a3e9b253264e5
|
3 |
size 4734533160
|
trainer_log.jsonl
CHANGED
@@ -201,3 +201,104 @@
|
|
201 |
{"current_steps": 201, "total_steps": 366, "loss": 0.4967, "lr": 5.071614405023938e-06, "epoch": 1.6384720327421554, "percentage": 54.92, "elapsed_time": "4:23:31", "remaining_time": "3:36:19"}
|
202 |
{"current_steps": 202, "total_steps": 366, "loss": 0.5213, "lr": 5.023872193905316e-06, "epoch": 1.6466575716234653, "percentage": 55.19, "elapsed_time": "4:25:07", "remaining_time": "3:35:14"}
|
203 |
{"current_steps": 203, "total_steps": 366, "loss": 0.5002, "lr": 4.976127806094685e-06, "epoch": 1.654843110504775, "percentage": 55.46, "elapsed_time": "4:26:20", "remaining_time": "3:33:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
201 |
{"current_steps": 201, "total_steps": 366, "loss": 0.4967, "lr": 5.071614405023938e-06, "epoch": 1.6384720327421554, "percentage": 54.92, "elapsed_time": "4:23:31", "remaining_time": "3:36:19"}
|
202 |
{"current_steps": 202, "total_steps": 366, "loss": 0.5213, "lr": 5.023872193905316e-06, "epoch": 1.6466575716234653, "percentage": 55.19, "elapsed_time": "4:25:07", "remaining_time": "3:35:14"}
|
203 |
{"current_steps": 203, "total_steps": 366, "loss": 0.5002, "lr": 4.976127806094685e-06, "epoch": 1.654843110504775, "percentage": 55.46, "elapsed_time": "4:26:20", "remaining_time": "3:33:51"}
|
204 |
+
{"current_steps": 204, "total_steps": 366, "loss": 0.4974, "lr": 4.928385594976063e-06, "epoch": 1.6630286493860846, "percentage": 55.74, "elapsed_time": "4:27:33", "remaining_time": "3:32:28"}
|
205 |
+
{"current_steps": 205, "total_steps": 366, "loss": 0.5409, "lr": 4.880649913734996e-06, "epoch": 1.6712141882673943, "percentage": 56.01, "elapsed_time": "4:28:37", "remaining_time": "3:30:58"}
|
206 |
+
{"current_steps": 206, "total_steps": 366, "loss": 0.5423, "lr": 4.832925114961629e-06, "epoch": 1.679399727148704, "percentage": 56.28, "elapsed_time": "4:29:50", "remaining_time": "3:29:34"}
|
207 |
+
{"current_steps": 207, "total_steps": 366, "loss": 0.4958, "lr": 4.785215550253826e-06, "epoch": 1.6875852660300137, "percentage": 56.56, "elapsed_time": "4:31:00", "remaining_time": "3:28:09"}
|
208 |
+
{"current_steps": 208, "total_steps": 366, "loss": 0.5131, "lr": 4.737525569820405e-06, "epoch": 1.6957708049113234, "percentage": 56.83, "elapsed_time": "4:32:27", "remaining_time": "3:26:57"}
|
209 |
+
{"current_steps": 209, "total_steps": 366, "loss": 0.5177, "lr": 4.689859522084457e-06, "epoch": 1.703956343792633, "percentage": 57.1, "elapsed_time": "4:33:48", "remaining_time": "3:25:41"}
|
210 |
+
{"current_steps": 210, "total_steps": 366, "loss": 0.5103, "lr": 4.64222175328687e-06, "epoch": 1.7121418826739427, "percentage": 57.38, "elapsed_time": "4:35:05", "remaining_time": "3:24:20"}
|
211 |
+
{"current_steps": 211, "total_steps": 366, "loss": 0.5332, "lr": 4.594616607090028e-06, "epoch": 1.7203274215552524, "percentage": 57.65, "elapsed_time": "4:36:16", "remaining_time": "3:22:56"}
|
212 |
+
{"current_steps": 212, "total_steps": 366, "loss": 0.5015, "lr": 4.547048424181751e-06, "epoch": 1.728512960436562, "percentage": 57.92, "elapsed_time": "4:37:21", "remaining_time": "3:21:28"}
|
213 |
+
{"current_steps": 213, "total_steps": 366, "loss": 0.5343, "lr": 4.499521541879508e-06, "epoch": 1.7366984993178718, "percentage": 58.2, "elapsed_time": "4:38:37", "remaining_time": "3:20:08"}
|
214 |
+
{"current_steps": 214, "total_steps": 366, "loss": 0.5206, "lr": 4.452040293734934e-06, "epoch": 1.7448840381991815, "percentage": 58.47, "elapsed_time": "4:39:56", "remaining_time": "3:18:49"}
|
215 |
+
{"current_steps": 215, "total_steps": 366, "loss": 0.5419, "lr": 4.40460900913869e-06, "epoch": 1.7530695770804912, "percentage": 58.74, "elapsed_time": "4:41:15", "remaining_time": "3:17:32"}
|
216 |
+
{"current_steps": 216, "total_steps": 366, "loss": 0.5214, "lr": 4.357232012925714e-06, "epoch": 1.7612551159618008, "percentage": 59.02, "elapsed_time": "4:42:40", "remaining_time": "3:16:17"}
|
217 |
+
{"current_steps": 217, "total_steps": 366, "loss": 0.5125, "lr": 4.309913624980866e-06, "epoch": 1.7694406548431105, "percentage": 59.29, "elapsed_time": "4:43:54", "remaining_time": "3:14:56"}
|
218 |
+
{"current_steps": 218, "total_steps": 366, "loss": 0.5562, "lr": 4.262658159845046e-06, "epoch": 1.7776261937244202, "percentage": 59.56, "elapsed_time": "4:45:09", "remaining_time": "3:13:35"}
|
219 |
+
{"current_steps": 219, "total_steps": 366, "loss": 0.5372, "lr": 4.2154699263217794e-06, "epoch": 1.78581173260573, "percentage": 59.84, "elapsed_time": "4:46:14", "remaining_time": "3:12:07"}
|
220 |
+
{"current_steps": 220, "total_steps": 366, "loss": 0.5242, "lr": 4.1683532270843505e-06, "epoch": 1.7939972714870396, "percentage": 60.11, "elapsed_time": "4:47:29", "remaining_time": "3:10:47"}
|
221 |
+
{"current_steps": 221, "total_steps": 366, "loss": 0.5593, "lr": 4.121312358283464e-06, "epoch": 1.8021828103683493, "percentage": 60.38, "elapsed_time": "4:48:56", "remaining_time": "3:09:34"}
|
222 |
+
{"current_steps": 222, "total_steps": 366, "loss": 0.5261, "lr": 4.074351609155527e-06, "epoch": 1.810368349249659, "percentage": 60.66, "elapsed_time": "4:50:07", "remaining_time": "3:08:11"}
|
223 |
+
{"current_steps": 223, "total_steps": 366, "loss": 0.5112, "lr": 4.0274752616315485e-06, "epoch": 1.8185538881309686, "percentage": 60.93, "elapsed_time": "4:51:27", "remaining_time": "3:06:54"}
|
224 |
+
{"current_steps": 224, "total_steps": 366, "loss": 0.5445, "lr": 3.980687589946715e-06, "epoch": 1.8267394270122783, "percentage": 61.2, "elapsed_time": "4:52:43", "remaining_time": "3:05:33"}
|
225 |
+
{"current_steps": 225, "total_steps": 366, "loss": 0.5305, "lr": 3.9339928602506505e-06, "epoch": 1.834924965893588, "percentage": 61.48, "elapsed_time": "4:54:13", "remaining_time": "3:04:22"}
|
226 |
+
{"current_steps": 226, "total_steps": 366, "loss": 0.4989, "lr": 3.887395330218429e-06, "epoch": 1.8431105047748977, "percentage": 61.75, "elapsed_time": "4:55:36", "remaining_time": "3:03:07"}
|
227 |
+
{"current_steps": 227, "total_steps": 366, "loss": 0.5445, "lr": 3.840899248662358e-06, "epoch": 1.8512960436562074, "percentage": 62.02, "elapsed_time": "4:56:42", "remaining_time": "3:01:41"}
|
228 |
+
{"current_steps": 228, "total_steps": 366, "loss": 0.5413, "lr": 3.7945088551445698e-06, "epoch": 1.859481582537517, "percentage": 62.3, "elapsed_time": "4:57:46", "remaining_time": "3:00:13"}
|
229 |
+
{"current_steps": 229, "total_steps": 366, "loss": 0.528, "lr": 3.748228379590438e-06, "epoch": 1.8676671214188267, "percentage": 62.57, "elapsed_time": "4:59:01", "remaining_time": "2:58:53"}
|
230 |
+
{"current_steps": 230, "total_steps": 366, "loss": 0.5079, "lr": 3.7020620419029095e-06, "epoch": 1.8758526603001364, "percentage": 62.84, "elapsed_time": "5:00:14", "remaining_time": "2:57:31"}
|
231 |
+
{"current_steps": 231, "total_steps": 366, "loss": 0.4863, "lr": 3.656014051577713e-06, "epoch": 1.884038199181446, "percentage": 63.11, "elapsed_time": "5:01:34", "remaining_time": "2:56:14"}
|
232 |
+
{"current_steps": 232, "total_steps": 366, "loss": 0.5311, "lr": 3.610088607319544e-06, "epoch": 1.8922237380627558, "percentage": 63.39, "elapsed_time": "5:02:51", "remaining_time": "2:54:55"}
|
233 |
+
{"current_steps": 233, "total_steps": 366, "loss": 0.5267, "lr": 3.5642898966592145e-06, "epoch": 1.9004092769440655, "percentage": 63.66, "elapsed_time": "5:03:52", "remaining_time": "2:53:27"}
|
234 |
+
{"current_steps": 234, "total_steps": 366, "loss": 0.5157, "lr": 3.518622095571831e-06, "epoch": 1.9085948158253752, "percentage": 63.93, "elapsed_time": "5:05:07", "remaining_time": "2:52:07"}
|
235 |
+
{"current_steps": 235, "total_steps": 366, "loss": 0.5167, "lr": 3.4730893680960267e-06, "epoch": 1.9167803547066848, "percentage": 64.21, "elapsed_time": "5:06:20", "remaining_time": "2:50:46"}
|
236 |
+
{"current_steps": 236, "total_steps": 366, "loss": 0.5032, "lr": 3.4276958659542838e-06, "epoch": 1.9249658935879945, "percentage": 64.48, "elapsed_time": "5:07:55", "remaining_time": "2:49:37"}
|
237 |
+
{"current_steps": 237, "total_steps": 366, "loss": 0.5354, "lr": 3.382445728174365e-06, "epoch": 1.9331514324693042, "percentage": 64.75, "elapsed_time": "5:09:07", "remaining_time": "2:48:15"}
|
238 |
+
{"current_steps": 238, "total_steps": 366, "loss": 0.5246, "lr": 3.3373430807119212e-06, "epoch": 1.941336971350614, "percentage": 65.03, "elapsed_time": "5:10:27", "remaining_time": "2:46:58"}
|
239 |
+
{"current_steps": 239, "total_steps": 366, "loss": 0.5572, "lr": 3.292392036074277e-06, "epoch": 1.9495225102319236, "percentage": 65.3, "elapsed_time": "5:11:32", "remaining_time": "2:45:32"}
|
240 |
+
{"current_steps": 240, "total_steps": 366, "loss": 0.525, "lr": 3.2475966929454505e-06, "epoch": 1.9577080491132333, "percentage": 65.57, "elapsed_time": "5:12:25", "remaining_time": "2:44:01"}
|
241 |
+
{"current_steps": 241, "total_steps": 366, "loss": 0.5047, "lr": 3.202961135812437e-06, "epoch": 1.965893587994543, "percentage": 65.85, "elapsed_time": "5:13:40", "remaining_time": "2:42:41"}
|
242 |
+
{"current_steps": 242, "total_steps": 366, "loss": 0.4997, "lr": 3.1584894345927663e-06, "epoch": 1.9740791268758526, "percentage": 66.12, "elapsed_time": "5:14:53", "remaining_time": "2:41:20"}
|
243 |
+
{"current_steps": 243, "total_steps": 366, "loss": 0.5359, "lr": 3.114185644263415e-06, "epoch": 1.9822646657571623, "percentage": 66.39, "elapsed_time": "5:16:29", "remaining_time": "2:40:11"}
|
244 |
+
{"current_steps": 244, "total_steps": 366, "loss": 0.5239, "lr": 3.0700538044910684e-06, "epoch": 1.990450204638472, "percentage": 66.67, "elapsed_time": "5:17:51", "remaining_time": "2:38:55"}
|
245 |
+
{"current_steps": 245, "total_steps": 366, "loss": 0.5093, "lr": 3.0260979392637753e-06, "epoch": 1.9986357435197817, "percentage": 66.94, "elapsed_time": "5:18:56", "remaining_time": "2:37:30"}
|
246 |
+
{"current_steps": 246, "total_steps": 366, "loss": 0.4999, "lr": 2.9823220565240396e-06, "epoch": 2.0, "percentage": 67.21, "elapsed_time": "5:19:10", "remaining_time": "2:35:41"}
|
247 |
+
{"current_steps": 247, "total_steps": 366, "loss": 0.4133, "lr": 2.9387301478033694e-06, "epoch": 2.00818553888131, "percentage": 67.49, "elapsed_time": "5:20:18", "remaining_time": "2:34:19"}
|
248 |
+
{"current_steps": 248, "total_steps": 366, "loss": 0.4113, "lr": 2.8953261878583263e-06, "epoch": 2.0163710777626194, "percentage": 67.76, "elapsed_time": "5:21:50", "remaining_time": "2:33:08"}
|
249 |
+
{"current_steps": 249, "total_steps": 366, "loss": 0.4277, "lr": 2.852114134308104e-06, "epoch": 2.0245566166439293, "percentage": 68.03, "elapsed_time": "5:22:54", "remaining_time": "2:31:43"}
|
250 |
+
{"current_steps": 250, "total_steps": 366, "loss": 0.4181, "lr": 2.8090979272736663e-06, "epoch": 2.0327421555252387, "percentage": 68.31, "elapsed_time": "5:24:16", "remaining_time": "2:30:27"}
|
251 |
+
{"current_steps": 251, "total_steps": 366, "loss": 0.414, "lr": 2.766281489018482e-06, "epoch": 2.0409276944065486, "percentage": 68.58, "elapsed_time": "5:25:25", "remaining_time": "2:29:05"}
|
252 |
+
{"current_steps": 252, "total_steps": 366, "loss": 0.4264, "lr": 2.7236687235908953e-06, "epoch": 2.049113233287858, "percentage": 68.85, "elapsed_time": "5:26:42", "remaining_time": "2:27:47"}
|
253 |
+
{"current_steps": 253, "total_steps": 366, "loss": 0.424, "lr": 2.681263516468139e-06, "epoch": 2.057298772169168, "percentage": 69.13, "elapsed_time": "5:28:24", "remaining_time": "2:26:40"}
|
254 |
+
{"current_steps": 254, "total_steps": 366, "loss": 0.418, "lr": 2.6390697342020665e-06, "epoch": 2.0654843110504775, "percentage": 69.4, "elapsed_time": "5:29:45", "remaining_time": "2:25:24"}
|
255 |
+
{"current_steps": 255, "total_steps": 366, "loss": 0.4351, "lr": 2.5970912240665815e-06, "epoch": 2.0736698499317874, "percentage": 69.67, "elapsed_time": "5:31:03", "remaining_time": "2:24:06"}
|
256 |
+
{"current_steps": 256, "total_steps": 366, "loss": 0.4047, "lr": 2.5553318137068473e-06, "epoch": 2.081855388813097, "percentage": 69.95, "elapsed_time": "5:32:23", "remaining_time": "2:22:49"}
|
257 |
+
{"current_steps": 257, "total_steps": 366, "loss": 0.4103, "lr": 2.5137953107902814e-06, "epoch": 2.0900409276944067, "percentage": 70.22, "elapsed_time": "5:33:42", "remaining_time": "2:21:32"}
|
258 |
+
{"current_steps": 258, "total_steps": 366, "loss": 0.4098, "lr": 2.472485502659358e-06, "epoch": 2.098226466575716, "percentage": 70.49, "elapsed_time": "5:34:59", "remaining_time": "2:20:13"}
|
259 |
+
{"current_steps": 259, "total_steps": 366, "loss": 0.3979, "lr": 2.4314061559862836e-06, "epoch": 2.106412005457026, "percentage": 70.77, "elapsed_time": "5:36:26", "remaining_time": "2:18:59"}
|
260 |
+
{"current_steps": 260, "total_steps": 366, "loss": 0.4001, "lr": 2.3905610164295394e-06, "epoch": 2.1145975443383356, "percentage": 71.04, "elapsed_time": "5:37:44", "remaining_time": "2:17:41"}
|
261 |
+
{"current_steps": 261, "total_steps": 366, "loss": 0.424, "lr": 2.3499538082923607e-06, "epoch": 2.1227830832196455, "percentage": 71.31, "elapsed_time": "5:39:00", "remaining_time": "2:16:22"}
|
262 |
+
{"current_steps": 262, "total_steps": 366, "loss": 0.4116, "lr": 2.309588234183137e-06, "epoch": 2.130968622100955, "percentage": 71.58, "elapsed_time": "5:40:45", "remaining_time": "2:15:15"}
|
263 |
+
{"current_steps": 263, "total_steps": 366, "loss": 0.3698, "lr": 2.2694679746778116e-06, "epoch": 2.139154160982265, "percentage": 71.86, "elapsed_time": "5:41:54", "remaining_time": "2:13:54"}
|
264 |
+
{"current_steps": 264, "total_steps": 366, "loss": 0.3919, "lr": 2.22959668798428e-06, "epoch": 2.1473396998635743, "percentage": 72.13, "elapsed_time": "5:43:16", "remaining_time": "2:12:37"}
|
265 |
+
{"current_steps": 265, "total_steps": 366, "loss": 0.407, "lr": 2.1899780096088375e-06, "epoch": 2.155525238744884, "percentage": 72.4, "elapsed_time": "5:44:38", "remaining_time": "2:11:21"}
|
266 |
+
{"current_steps": 266, "total_steps": 366, "loss": 0.4097, "lr": 2.1506155520246795e-06, "epoch": 2.1637107776261937, "percentage": 72.68, "elapsed_time": "5:45:56", "remaining_time": "2:10:03"}
|
267 |
+
{"current_steps": 267, "total_steps": 366, "loss": 0.4161, "lr": 2.1115129043425188e-06, "epoch": 2.1718963165075036, "percentage": 72.95, "elapsed_time": "5:47:13", "remaining_time": "2:08:44"}
|
268 |
+
{"current_steps": 268, "total_steps": 366, "loss": 0.3763, "lr": 2.072673631983323e-06, "epoch": 2.180081855388813, "percentage": 73.22, "elapsed_time": "5:48:26", "remaining_time": "2:07:25"}
|
269 |
+
{"current_steps": 269, "total_steps": 366, "loss": 0.379, "lr": 2.0341012763532243e-06, "epoch": 2.188267394270123, "percentage": 73.5, "elapsed_time": "5:49:32", "remaining_time": "2:06:02"}
|
270 |
+
{"current_steps": 270, "total_steps": 366, "loss": 0.3986, "lr": 1.995799354520598e-06, "epoch": 2.1964529331514324, "percentage": 73.77, "elapsed_time": "5:50:41", "remaining_time": "2:04:41"}
|
271 |
+
{"current_steps": 271, "total_steps": 366, "loss": 0.3874, "lr": 1.9577713588953797e-06, "epoch": 2.2046384720327423, "percentage": 74.04, "elapsed_time": "5:51:57", "remaining_time": "2:03:22"}
|
272 |
+
{"current_steps": 272, "total_steps": 366, "loss": 0.3946, "lr": 1.9200207569106216e-06, "epoch": 2.212824010914052, "percentage": 74.32, "elapsed_time": "5:53:11", "remaining_time": "2:02:03"}
|
273 |
+
{"current_steps": 273, "total_steps": 366, "loss": 0.4007, "lr": 1.8825509907063328e-06, "epoch": 2.2210095497953617, "percentage": 74.59, "elapsed_time": "5:54:18", "remaining_time": "2:00:41"}
|
274 |
+
{"current_steps": 274, "total_steps": 366, "loss": 0.4269, "lr": 1.8453654768156138e-06, "epoch": 2.229195088676671, "percentage": 74.86, "elapsed_time": "5:55:31", "remaining_time": "1:59:22"}
|
275 |
+
{"current_steps": 275, "total_steps": 366, "loss": 0.3932, "lr": 1.8084676058531376e-06, "epoch": 2.237380627557981, "percentage": 75.14, "elapsed_time": "5:56:55", "remaining_time": "1:58:06"}
|
276 |
+
{"current_steps": 276, "total_steps": 366, "loss": 0.4322, "lr": 1.771860742205988e-06, "epoch": 2.2455661664392905, "percentage": 75.41, "elapsed_time": "5:58:00", "remaining_time": "1:56:44"}
|
277 |
+
{"current_steps": 277, "total_steps": 366, "loss": 0.436, "lr": 1.7355482237268983e-06, "epoch": 2.2537517053206004, "percentage": 75.68, "elapsed_time": "5:59:13", "remaining_time": "1:55:25"}
|
278 |
+
{"current_steps": 278, "total_steps": 366, "loss": 0.4093, "lr": 1.6995333614298908e-06, "epoch": 2.26193724420191, "percentage": 75.96, "elapsed_time": "6:00:42", "remaining_time": "1:54:10"}
|
279 |
+
{"current_steps": 279, "total_steps": 366, "loss": 0.3858, "lr": 1.6638194391883822e-06, "epoch": 2.27012278308322, "percentage": 76.23, "elapsed_time": "6:02:02", "remaining_time": "1:52:53"}
|
280 |
+
{"current_steps": 280, "total_steps": 366, "loss": 0.3954, "lr": 1.6284097134357535e-06, "epoch": 2.2783083219645293, "percentage": 76.5, "elapsed_time": "6:03:26", "remaining_time": "1:51:37"}
|
281 |
+
{"current_steps": 281, "total_steps": 366, "loss": 0.4086, "lr": 1.5933074128684333e-06, "epoch": 2.286493860845839, "percentage": 76.78, "elapsed_time": "6:04:42", "remaining_time": "1:50:19"}
|
282 |
+
{"current_steps": 282, "total_steps": 366, "loss": 0.4159, "lr": 1.5585157381514875e-06, "epoch": 2.2946793997271486, "percentage": 77.05, "elapsed_time": "6:06:02", "remaining_time": "1:49:01"}
|
283 |
+
{"current_steps": 283, "total_steps": 366, "loss": 0.4176, "lr": 1.5240378616267887e-06, "epoch": 2.3028649386084585, "percentage": 77.32, "elapsed_time": "6:07:02", "remaining_time": "1:47:38"}
|
284 |
+
{"current_steps": 284, "total_steps": 366, "loss": 0.389, "lr": 1.4898769270237611e-06, "epoch": 2.311050477489768, "percentage": 77.6, "elapsed_time": "6:08:26", "remaining_time": "1:46:22"}
|
285 |
+
{"current_steps": 285, "total_steps": 366, "loss": 0.3908, "lr": 1.4560360491727233e-06, "epoch": 2.319236016371078, "percentage": 77.87, "elapsed_time": "6:09:36", "remaining_time": "1:45:02"}
|
286 |
+
{"current_steps": 286, "total_steps": 366, "loss": 0.4133, "lr": 1.4225183137208775e-06, "epoch": 2.3274215552523874, "percentage": 78.14, "elapsed_time": "6:10:59", "remaining_time": "1:43:46"}
|
287 |
+
{"current_steps": 287, "total_steps": 366, "loss": 0.4233, "lr": 1.389326776850966e-06, "epoch": 2.3356070941336973, "percentage": 78.42, "elapsed_time": "6:12:15", "remaining_time": "1:42:28"}
|
288 |
+
{"current_steps": 288, "total_steps": 366, "loss": 0.4123, "lr": 1.3564644650025894e-06, "epoch": 2.3437926330150067, "percentage": 78.69, "elapsed_time": "6:13:38", "remaining_time": "1:41:11"}
|
289 |
+
{"current_steps": 289, "total_steps": 366, "loss": 0.3924, "lr": 1.323934374596268e-06, "epoch": 2.3519781718963166, "percentage": 78.96, "elapsed_time": "6:15:01", "remaining_time": "1:39:55"}
|
290 |
+
{"current_steps": 290, "total_steps": 366, "loss": 0.3871, "lr": 1.2917394717602123e-06, "epoch": 2.360163710777626, "percentage": 79.23, "elapsed_time": "6:16:19", "remaining_time": "1:38:37"}
|
291 |
+
{"current_steps": 291, "total_steps": 366, "loss": 0.3864, "lr": 1.2598826920598773e-06, "epoch": 2.368349249658936, "percentage": 79.51, "elapsed_time": "6:17:51", "remaining_time": "1:37:23"}
|
292 |
+
{"current_steps": 292, "total_steps": 366, "loss": 0.4317, "lr": 1.2283669402302878e-06, "epoch": 2.3765347885402455, "percentage": 79.78, "elapsed_time": "6:19:13", "remaining_time": "1:36:06"}
|
293 |
+
{"current_steps": 293, "total_steps": 366, "loss": 0.3923, "lr": 1.197195089911191e-06, "epoch": 2.3847203274215554, "percentage": 80.05, "elapsed_time": "6:20:31", "remaining_time": "1:34:48"}
|
294 |
+
{"current_steps": 294, "total_steps": 366, "loss": 0.3893, "lr": 1.166369983385024e-06, "epoch": 2.392905866302865, "percentage": 80.33, "elapsed_time": "6:21:31", "remaining_time": "1:33:26"}
|
295 |
+
{"current_steps": 295, "total_steps": 366, "loss": 0.419, "lr": 1.1358944313177566e-06, "epoch": 2.4010914051841747, "percentage": 80.6, "elapsed_time": "6:22:42", "remaining_time": "1:32:06"}
|
296 |
+
{"current_steps": 296, "total_steps": 366, "loss": 0.4134, "lr": 1.1057712125026116e-06, "epoch": 2.409276944065484, "percentage": 80.87, "elapsed_time": "6:23:58", "remaining_time": "1:30:48"}
|
297 |
+
{"current_steps": 297, "total_steps": 366, "loss": 0.4299, "lr": 1.0760030736066952e-06, "epoch": 2.417462482946794, "percentage": 81.15, "elapsed_time": "6:25:25", "remaining_time": "1:29:32"}
|
298 |
+
{"current_steps": 298, "total_steps": 366, "loss": 0.3721, "lr": 1.0465927289205452e-06, "epoch": 2.4256480218281036, "percentage": 81.42, "elapsed_time": "6:26:40", "remaining_time": "1:28:14"}
|
299 |
+
{"current_steps": 299, "total_steps": 366, "loss": 0.4164, "lr": 1.0175428601106441e-06, "epoch": 2.4338335607094135, "percentage": 81.69, "elapsed_time": "6:27:53", "remaining_time": "1:26:55"}
|
300 |
+
{"current_steps": 300, "total_steps": 366, "loss": 0.3968, "lr": 9.888561159748995e-07, "epoch": 2.442019099590723, "percentage": 81.97, "elapsed_time": "6:29:14", "remaining_time": "1:25:37"}
|
301 |
+
{"current_steps": 301, "total_steps": 366, "loss": 0.417, "lr": 9.605351122011308e-07, "epoch": 2.450204638472033, "percentage": 82.24, "elapsed_time": "6:34:43", "remaining_time": "1:25:14"}
|
302 |
+
{"current_steps": 302, "total_steps": 366, "loss": 0.3973, "lr": 9.325824311285564e-07, "epoch": 2.4583901773533423, "percentage": 82.51, "elapsed_time": "6:35:39", "remaining_time": "1:23:50"}
|
303 |
+
{"current_steps": 303, "total_steps": 366, "loss": 0.4261, "lr": 9.050006215123419e-07, "epoch": 2.466575716234652, "percentage": 82.79, "elapsed_time": "6:36:56", "remaining_time": "1:22:31"}
|
304 |
+
{"current_steps": 304, "total_steps": 366, "loss": 0.4053, "lr": 8.777921982911996e-07, "epoch": 2.4747612551159617, "percentage": 83.06, "elapsed_time": "6:38:01", "remaining_time": "1:21:10"}
|