|
{"current_steps": 1, "total_steps": 69, "loss": 0.8402, "lr": 4.9974091841168195e-05, "epoch": 0.01444043321299639, "percentage": 1.45, "elapsed_time": "0:02:48", "remaining_time": "3:10:24", "throughput": 12482.16, "total_tokens": 2097152} |
|
{"current_steps": 2, "total_steps": 69, "loss": 0.7686, "lr": 4.9896421063288286e-05, "epoch": 0.02888086642599278, "percentage": 2.9, "elapsed_time": "0:05:26", "remaining_time": "3:02:12", "throughput": 12852.44, "total_tokens": 4194304} |
|
{"current_steps": 3, "total_steps": 69, "loss": 0.7563, "lr": 4.976714865090827e-05, "epoch": 0.04332129963898917, "percentage": 4.35, "elapsed_time": "0:08:04", "remaining_time": "2:57:42", "throughput": 12981.5, "total_tokens": 6291456} |
|
{"current_steps": 4, "total_steps": 69, "loss": 0.7139, "lr": 4.958654254084355e-05, "epoch": 0.05776173285198556, "percentage": 5.8, "elapsed_time": "0:10:42", "remaining_time": "2:54:02", "throughput": 13054.16, "total_tokens": 8388608} |
|
{"current_steps": 5, "total_steps": 69, "loss": 0.6793, "lr": 4.9354977066836986e-05, "epoch": 0.07220216606498195, "percentage": 7.25, "elapsed_time": "0:13:20", "remaining_time": "2:50:47", "throughput": 13098.17, "total_tokens": 10485760} |
|
{"current_steps": 6, "total_steps": 69, "loss": 0.6631, "lr": 4.907293218369499e-05, "epoch": 0.08664259927797834, "percentage": 8.7, "elapsed_time": "0:15:58", "remaining_time": "2:47:46", "throughput": 13124.77, "total_tokens": 12582912} |
|
{"current_steps": 7, "total_steps": 69, "loss": 0.64, "lr": 4.874099247250798e-05, "epoch": 0.10108303249097472, "percentage": 10.14, "elapsed_time": "0:18:36", "remaining_time": "2:44:52", "throughput": 13144.27, "total_tokens": 14680064} |
|
{"current_steps": 8, "total_steps": 69, "loss": 0.6145, "lr": 4.835984592901678e-05, "epoch": 0.11552346570397112, "percentage": 11.59, "elapsed_time": "0:21:14", "remaining_time": "2:42:01", "throughput": 13158.63, "total_tokens": 16777216} |
|
{"current_steps": 9, "total_steps": 69, "loss": 0.5997, "lr": 4.793028253763633e-05, "epoch": 0.1299638989169675, "percentage": 13.04, "elapsed_time": "0:23:52", "remaining_time": "2:39:11", "throughput": 13173.26, "total_tokens": 18874368} |
|
{"current_steps": 10, "total_steps": 69, "loss": 0.5896, "lr": 4.74531926340924e-05, "epoch": 0.1444043321299639, "percentage": 14.49, "elapsed_time": "0:26:30", "remaining_time": "2:36:25", "throughput": 13182.64, "total_tokens": 20971520} |
|
{"current_steps": 11, "total_steps": 69, "loss": 0.6025, "lr": 4.6929565060064864e-05, "epoch": 0.1588447653429603, "percentage": 15.94, "elapsed_time": "0:29:08", "remaining_time": "2:33:40", "throughput": 13191.88, "total_tokens": 23068672} |
|
{"current_steps": 12, "total_steps": 69, "loss": 0.5644, "lr": 4.6360485113662216e-05, "epoch": 0.17328519855595667, "percentage": 17.39, "elapsed_time": "0:31:46", "remaining_time": "2:30:57", "throughput": 13197.39, "total_tokens": 25165824} |
|
{"current_steps": 13, "total_steps": 69, "loss": 0.5558, "lr": 4.574713229997563e-05, "epoch": 0.18772563176895307, "percentage": 18.84, "elapsed_time": "0:34:24", "remaining_time": "2:28:14", "throughput": 13204.31, "total_tokens": 27262976} |
|
{"current_steps": 14, "total_steps": 69, "loss": 0.5705, "lr": 4.509077788637446e-05, "epoch": 0.20216606498194944, "percentage": 20.29, "elapsed_time": "0:37:02", "remaining_time": "2:25:32", "throughput": 13208.35, "total_tokens": 29360128} |
|
{"current_steps": 15, "total_steps": 69, "loss": 0.5694, "lr": 4.43927822676105e-05, "epoch": 0.21660649819494585, "percentage": 21.74, "elapsed_time": "0:39:40", "remaining_time": "2:22:51", "throughput": 13212.19, "total_tokens": 31457280} |
|
{"current_steps": 16, "total_steps": 69, "loss": 0.559, "lr": 4.365459214619214e-05, "epoch": 0.23104693140794225, "percentage": 23.19, "elapsed_time": "0:42:18", "remaining_time": "2:20:09", "throughput": 13217.11, "total_tokens": 33554432} |
|
{"current_steps": 17, "total_steps": 69, "loss": 0.5628, "lr": 4.2877737533872485e-05, "epoch": 0.24548736462093862, "percentage": 24.64, "elapsed_time": "0:44:56", "remaining_time": "2:17:28", "throughput": 13220.46, "total_tokens": 35651584} |
|
{"current_steps": 18, "total_steps": 69, "loss": 0.5553, "lr": 4.206382858046636e-05, "epoch": 0.259927797833935, "percentage": 26.09, "elapsed_time": "0:47:34", "remaining_time": "2:14:48", "throughput": 13223.11, "total_tokens": 37748736} |
|
{"current_steps": 19, "total_steps": 69, "loss": 0.5401, "lr": 4.12145522365689e-05, "epoch": 0.2743682310469314, "percentage": 27.54, "elapsed_time": "0:50:12", "remaining_time": "2:12:08", "throughput": 13225.48, "total_tokens": 39845888} |
|
{"current_steps": 20, "total_steps": 69, "loss": 0.575, "lr": 4.033166875709291e-05, "epoch": 0.2888086642599278, "percentage": 28.99, "elapsed_time": "0:52:51", "remaining_time": "2:09:29", "throughput": 13226.89, "total_tokens": 41943040} |
|
{"current_steps": 21, "total_steps": 69, "loss": 0.5398, "lr": 3.941700805287168e-05, "epoch": 0.30324909747292417, "percentage": 30.43, "elapsed_time": "0:55:29", "remaining_time": "2:06:49", "throughput": 13228.58, "total_tokens": 44040192} |
|
{"current_steps": 22, "total_steps": 69, "loss": 0.5389, "lr": 3.8472465897889394e-05, "epoch": 0.3176895306859206, "percentage": 31.88, "elapsed_time": "0:58:07", "remaining_time": "2:04:09", "throughput": 13231.1, "total_tokens": 46137344} |
|
{"current_steps": 23, "total_steps": 69, "loss": 0.5451, "lr": 3.7500000000000003e-05, "epoch": 0.33212996389891697, "percentage": 33.33, "elapsed_time": "1:00:44", "remaining_time": "2:01:29", "throughput": 13234.31, "total_tokens": 48234496} |
|
{"current_steps": 24, "total_steps": 69, "loss": 0.5558, "lr": 3.6501625943278805e-05, "epoch": 0.34657039711191334, "percentage": 34.78, "elapsed_time": "1:03:22", "remaining_time": "1:58:50", "throughput": 13235.05, "total_tokens": 50331648} |
|
{"current_steps": 25, "total_steps": 69, "loss": 0.5403, "lr": 3.547941301041661e-05, "epoch": 0.36101083032490977, "percentage": 36.23, "elapsed_time": "1:06:00", "remaining_time": "1:56:10", "throughput": 13238.0, "total_tokens": 52428800} |
|
{"current_steps": 26, "total_steps": 69, "loss": 0.5405, "lr": 3.443547989381536e-05, "epoch": 0.37545126353790614, "percentage": 37.68, "elapsed_time": "1:08:38", "remaining_time": "1:53:30", "throughput": 13240.74, "total_tokens": 54525952} |
|
{"current_steps": 27, "total_steps": 69, "loss": 0.5577, "lr": 3.3371990304274656e-05, "epoch": 0.3898916967509025, "percentage": 39.13, "elapsed_time": "1:11:15", "remaining_time": "1:50:51", "throughput": 13242.13, "total_tokens": 56623104} |
|
{"current_steps": 28, "total_steps": 69, "loss": 0.5345, "lr": 3.2291148486370626e-05, "epoch": 0.4043321299638989, "percentage": 40.58, "elapsed_time": "1:13:53", "remaining_time": "1:48:12", "throughput": 13243.46, "total_tokens": 58720256} |
|
{"current_steps": 29, "total_steps": 69, "loss": 0.5484, "lr": 3.11951946498225e-05, "epoch": 0.4187725631768953, "percentage": 42.03, "elapsed_time": "1:16:32", "remaining_time": "1:45:34", "throughput": 13243.76, "total_tokens": 60817408} |
|
{"current_steps": 30, "total_steps": 69, "loss": 0.5485, "lr": 3.008640032631585e-05, "epoch": 0.4332129963898917, "percentage": 43.48, "elapsed_time": "1:19:10", "remaining_time": "1:42:55", "throughput": 13245.01, "total_tokens": 62914560} |
|
{"current_steps": 31, "total_steps": 69, "loss": 0.5299, "lr": 2.8967063661406285e-05, "epoch": 0.44765342960288806, "percentage": 44.93, "elapsed_time": "1:21:48", "remaining_time": "1:40:16", "throughput": 13245.72, "total_tokens": 65011712} |
|
{"current_steps": 32, "total_steps": 69, "loss": 0.539, "lr": 2.7839504651261872e-05, "epoch": 0.4620938628158845, "percentage": 46.38, "elapsed_time": "1:24:26", "remaining_time": "1:37:37", "throughput": 13246.45, "total_tokens": 67108864} |
|
{"current_steps": 33, "total_steps": 69, "loss": 0.5248, "lr": 2.6706060334116777e-05, "epoch": 0.47653429602888087, "percentage": 47.83, "elapsed_time": "1:27:04", "remaining_time": "1:34:58", "throughput": 13247.54, "total_tokens": 69206016} |
|
{"current_steps": 34, "total_steps": 69, "loss": 0.5342, "lr": 2.556907994640264e-05, "epoch": 0.49097472924187724, "percentage": 49.28, "elapsed_time": "1:29:41", "remaining_time": "1:32:20", "throughput": 13248.46, "total_tokens": 71303168} |
|
{"current_steps": 35, "total_steps": 69, "loss": 0.5431, "lr": 2.4430920053597356e-05, "epoch": 0.5054151624548736, "percentage": 50.72, "elapsed_time": "1:32:19", "remaining_time": "1:29:41", "throughput": 13249.53, "total_tokens": 73400320} |
|
{"current_steps": 36, "total_steps": 69, "loss": 0.5471, "lr": 2.329393966588323e-05, "epoch": 0.51985559566787, "percentage": 52.17, "elapsed_time": "1:34:57", "remaining_time": "1:27:02", "throughput": 13250.51, "total_tokens": 75497472} |
|
{"current_steps": 37, "total_steps": 69, "loss": 0.542, "lr": 2.2160495348738123e-05, "epoch": 0.5342960288808665, "percentage": 53.62, "elapsed_time": "1:37:35", "remaining_time": "1:24:24", "throughput": 13251.85, "total_tokens": 77594624} |
|
{"current_steps": 38, "total_steps": 69, "loss": 0.542, "lr": 2.1032936338593718e-05, "epoch": 0.5487364620938628, "percentage": 55.07, "elapsed_time": "1:40:12", "remaining_time": "1:21:45", "throughput": 13253.57, "total_tokens": 79691776} |
|
{"current_steps": 39, "total_steps": 69, "loss": 0.542, "lr": 1.991359967368416e-05, "epoch": 0.5631768953068592, "percentage": 56.52, "elapsed_time": "1:42:50", "remaining_time": "1:19:06", "throughput": 13255.1, "total_tokens": 81788928} |
|
{"current_steps": 40, "total_steps": 69, "loss": 0.5425, "lr": 1.8804805350177505e-05, "epoch": 0.5776173285198556, "percentage": 57.97, "elapsed_time": "1:45:27", "remaining_time": "1:16:27", "throughput": 13256.36, "total_tokens": 83886080} |
|
{"current_steps": 41, "total_steps": 69, "loss": 0.5482, "lr": 1.7708851513629377e-05, "epoch": 0.592057761732852, "percentage": 59.42, "elapsed_time": "1:48:05", "remaining_time": "1:13:49", "throughput": 13257.04, "total_tokens": 85983232} |
|
{"current_steps": 42, "total_steps": 69, "loss": 0.5598, "lr": 1.6628009695725346e-05, "epoch": 0.6064981949458483, "percentage": 60.87, "elapsed_time": "1:50:43", "remaining_time": "1:11:10", "throughput": 13258.73, "total_tokens": 88080384} |
|
{"current_steps": 43, "total_steps": 69, "loss": 0.5402, "lr": 1.5564520106184644e-05, "epoch": 0.6209386281588448, "percentage": 62.32, "elapsed_time": "1:53:20", "remaining_time": "1:08:31", "throughput": 13260.29, "total_tokens": 90177536} |
|
{"current_steps": 44, "total_steps": 69, "loss": 0.5413, "lr": 1.4520586989583406e-05, "epoch": 0.6353790613718412, "percentage": 63.77, "elapsed_time": "1:55:58", "remaining_time": "1:05:53", "throughput": 13261.5, "total_tokens": 92274688} |
|
{"current_steps": 45, "total_steps": 69, "loss": 0.556, "lr": 1.3498374056721197e-05, "epoch": 0.6498194945848376, "percentage": 65.22, "elapsed_time": "1:58:35", "remaining_time": "1:03:15", "throughput": 13262.39, "total_tokens": 94371840} |
|
{"current_steps": 46, "total_steps": 69, "loss": 0.5341, "lr": 1.2500000000000006e-05, "epoch": 0.6642599277978339, "percentage": 66.67, "elapsed_time": "2:01:13", "remaining_time": "1:00:36", "throughput": 13263.23, "total_tokens": 96468992} |
|
{"current_steps": 47, "total_steps": 69, "loss": 0.5436, "lr": 1.1527534102110612e-05, "epoch": 0.6787003610108303, "percentage": 68.12, "elapsed_time": "2:03:51", "remaining_time": "0:57:58", "throughput": 13264.02, "total_tokens": 98566144} |
|
{"current_steps": 48, "total_steps": 69, "loss": 0.5393, "lr": 1.0582991947128324e-05, "epoch": 0.6931407942238267, "percentage": 69.57, "elapsed_time": "2:06:28", "remaining_time": "0:55:20", "throughput": 13264.84, "total_tokens": 100663296} |
|
{"current_steps": 49, "total_steps": 69, "loss": 0.5598, "lr": 9.668331242907089e-06, "epoch": 0.7075812274368231, "percentage": 71.01, "elapsed_time": "2:09:06", "remaining_time": "0:52:41", "throughput": 13265.65, "total_tokens": 102760448} |
|
{"current_steps": 50, "total_steps": 69, "loss": 0.5329, "lr": 8.785447763431101e-06, "epoch": 0.7220216606498195, "percentage": 72.46, "elapsed_time": "2:11:44", "remaining_time": "0:50:03", "throughput": 13265.87, "total_tokens": 104857600} |
|
{"current_steps": 51, "total_steps": 69, "loss": 0.5384, "lr": 7.936171419533653e-06, "epoch": 0.7364620938628159, "percentage": 73.91, "elapsed_time": "2:14:21", "remaining_time": "0:47:25", "throughput": 13266.73, "total_tokens": 106954752} |
|
{"current_steps": 52, "total_steps": 69, "loss": 0.5447, "lr": 7.122262466127514e-06, "epoch": 0.7509025270758123, "percentage": 75.36, "elapsed_time": "2:16:59", "remaining_time": "0:44:47", "throughput": 13267.67, "total_tokens": 109051904} |
|
{"current_steps": 53, "total_steps": 69, "loss": 0.5291, "lr": 6.3454078538078635e-06, "epoch": 0.7653429602888087, "percentage": 76.81, "elapsed_time": "2:19:37", "remaining_time": "0:42:08", "throughput": 13268.2, "total_tokens": 111149056} |
|
{"current_steps": 54, "total_steps": 69, "loss": 0.5258, "lr": 5.607217732389503e-06, "epoch": 0.779783393501805, "percentage": 78.26, "elapsed_time": "2:22:14", "remaining_time": "0:39:30", "throughput": 13269.48, "total_tokens": 113246208} |
|
{"current_steps": 55, "total_steps": 69, "loss": 0.5508, "lr": 4.9092221136255444e-06, "epoch": 0.7942238267148014, "percentage": 79.71, "elapsed_time": "2:24:51", "remaining_time": "0:36:52", "throughput": 13270.12, "total_tokens": 115343360} |
|
{"current_steps": 56, "total_steps": 69, "loss": 0.5439, "lr": 4.252867700024374e-06, "epoch": 0.8086642599277978, "percentage": 81.16, "elapsed_time": "2:27:29", "remaining_time": "0:34:14", "throughput": 13270.24, "total_tokens": 117440512} |
|
{"current_steps": 57, "total_steps": 69, "loss": 0.5261, "lr": 3.6395148863377858e-06, "epoch": 0.8231046931407943, "percentage": 82.61, "elapsed_time": "2:30:08", "remaining_time": "0:31:36", "throughput": 13270.03, "total_tokens": 119537664} |
|
{"current_steps": 58, "total_steps": 69, "loss": 0.5518, "lr": 3.0704349399351435e-06, "epoch": 0.8375451263537906, "percentage": 84.06, "elapsed_time": "2:32:45", "remaining_time": "0:28:58", "throughput": 13270.36, "total_tokens": 121634816} |
|
{"current_steps": 59, "total_steps": 69, "loss": 0.5444, "lr": 2.5468073659076e-06, "epoch": 0.851985559566787, "percentage": 85.51, "elapsed_time": "2:35:23", "remaining_time": "0:26:20", "throughput": 13270.7, "total_tokens": 123731968} |
|
{"current_steps": 60, "total_steps": 69, "loss": 0.5469, "lr": 2.0697174623636794e-06, "epoch": 0.8664259927797834, "percentage": 86.96, "elapsed_time": "2:38:01", "remaining_time": "0:23:42", "throughput": 13270.96, "total_tokens": 125829120} |
|
{"current_steps": 61, "total_steps": 69, "loss": 0.5335, "lr": 1.6401540709832242e-06, "epoch": 0.8808664259927798, "percentage": 88.41, "elapsed_time": "2:40:39", "remaining_time": "0:21:04", "throughput": 13271.26, "total_tokens": 127926272} |
|
{"current_steps": 62, "total_steps": 69, "loss": 0.5367, "lr": 1.2590075274920205e-06, "epoch": 0.8953068592057761, "percentage": 89.86, "elapsed_time": "2:43:16", "remaining_time": "0:18:26", "throughput": 13272.14, "total_tokens": 130023424} |
|
{"current_steps": 63, "total_steps": 69, "loss": 0.551, "lr": 9.270678163050217e-07, "epoch": 0.9097472924187726, "percentage": 91.3, "elapsed_time": "2:45:54", "remaining_time": "0:15:48", "throughput": 13272.46, "total_tokens": 132120576} |
|
{"current_steps": 64, "total_steps": 69, "loss": 0.5597, "lr": 6.450229331630253e-07, "epoch": 0.924187725631769, "percentage": 92.75, "elapsed_time": "2:48:32", "remaining_time": "0:13:10", "throughput": 13272.79, "total_tokens": 134217728} |
|
{"current_steps": 65, "total_steps": 69, "loss": 0.5369, "lr": 4.134574591564494e-07, "epoch": 0.9386281588447654, "percentage": 94.2, "elapsed_time": "2:51:09", "remaining_time": "0:10:31", "throughput": 13273.81, "total_tokens": 136314880} |
|
{"current_steps": 66, "total_steps": 69, "loss": 0.5451, "lr": 2.3285134909173112e-07, "epoch": 0.9530685920577617, "percentage": 95.65, "elapsed_time": "2:53:45", "remaining_time": "0:07:53", "throughput": 13276.09, "total_tokens": 138412032} |
|
{"current_steps": 67, "total_steps": 69, "loss": 0.5237, "lr": 1.0357893671171792e-07, "epoch": 0.9675090252707581, "percentage": 97.1, "elapsed_time": "2:56:20", "remaining_time": "0:05:15", "throughput": 13279.42, "total_tokens": 140509184} |
|
{"current_steps": 68, "total_steps": 69, "loss": 0.5604, "lr": 2.590815883181108e-08, "epoch": 0.9819494584837545, "percentage": 98.55, "elapsed_time": "2:58:55", "remaining_time": "0:02:37", "throughput": 13283.18, "total_tokens": 142606336} |
|
{"current_steps": 69, "total_steps": 69, "loss": 0.534, "lr": 0.0, "epoch": 0.9963898916967509, "percentage": 100.0, "elapsed_time": "3:01:30", "remaining_time": "0:00:00", "throughput": 13286.8, "total_tokens": 144703488} |
|
{"current_steps": 69, "total_steps": 69, "epoch": 0.9963898916967509, "percentage": 100.0, "elapsed_time": "3:01:52", "remaining_time": "0:00:00", "throughput": 13260.92, "total_tokens": 144703488} |
|
|