|
{"current_steps": 10, "total_steps": 3255, "loss": 1.3982, "lr": 3.067484662576687e-06, "epoch": 0.01535213970447131, "percentage": 0.31, "elapsed_time": "0:01:26", "remaining_time": "7:48:20"} |
|
{"current_steps": 20, "total_steps": 3255, "loss": 1.1812, "lr": 6.134969325153374e-06, "epoch": 0.03070427940894262, "percentage": 0.61, "elapsed_time": "0:02:55", "remaining_time": "7:53:35"} |
|
{"current_steps": 30, "total_steps": 3255, "loss": 1.2206, "lr": 9.202453987730062e-06, "epoch": 0.04605641911341393, "percentage": 0.92, "elapsed_time": "0:04:24", "remaining_time": "7:54:43"} |
|
{"current_steps": 40, "total_steps": 3255, "loss": 0.801, "lr": 1.2269938650306748e-05, "epoch": 0.06140855881788524, "percentage": 1.23, "elapsed_time": "0:05:54", "remaining_time": "7:54:51"} |
|
{"current_steps": 50, "total_steps": 3255, "loss": 0.5046, "lr": 1.5337423312883436e-05, "epoch": 0.07676069852235655, "percentage": 1.54, "elapsed_time": "0:07:23", "remaining_time": "7:53:56"} |
|
{"current_steps": 50, "total_steps": 3255, "eval_loss": 0.30626675486564636, "epoch": 0.07676069852235655, "percentage": 1.54, "elapsed_time": "0:10:29", "remaining_time": "11:12:42"} |
|
{"current_steps": 60, "total_steps": 3255, "loss": 0.2991, "lr": 1.8404907975460123e-05, "epoch": 0.09211283822682786, "percentage": 1.84, "elapsed_time": "0:12:01", "remaining_time": "10:40:44"} |
|
{"current_steps": 70, "total_steps": 3255, "loss": 0.2284, "lr": 2.1472392638036813e-05, "epoch": 0.10746497793129918, "percentage": 2.15, "elapsed_time": "0:13:31", "remaining_time": "10:15:09"} |
|
{"current_steps": 80, "total_steps": 3255, "loss": 0.1355, "lr": 2.4539877300613496e-05, "epoch": 0.12281711763577048, "percentage": 2.46, "elapsed_time": "0:15:00", "remaining_time": "9:55:18"} |
|
{"current_steps": 90, "total_steps": 3255, "loss": 0.1286, "lr": 2.7607361963190186e-05, "epoch": 0.1381692573402418, "percentage": 2.76, "elapsed_time": "0:16:28", "remaining_time": "9:39:27"} |
|
{"current_steps": 100, "total_steps": 3255, "loss": 0.1059, "lr": 3.067484662576687e-05, "epoch": 0.1535213970447131, "percentage": 3.07, "elapsed_time": "0:17:57", "remaining_time": "9:26:36"} |
|
{"current_steps": 100, "total_steps": 3255, "eval_loss": 0.08417145907878876, "epoch": 0.1535213970447131, "percentage": 3.07, "elapsed_time": "0:21:02", "remaining_time": "11:03:55"} |
|
{"current_steps": 110, "total_steps": 3255, "loss": 0.0726, "lr": 3.3742331288343556e-05, "epoch": 0.16887353674918443, "percentage": 3.38, "elapsed_time": "0:22:34", "remaining_time": "10:45:26"} |
|
{"current_steps": 120, "total_steps": 3255, "loss": 0.0767, "lr": 3.6809815950920246e-05, "epoch": 0.18422567645365573, "percentage": 3.69, "elapsed_time": "0:24:03", "remaining_time": "10:28:26"} |
|
{"current_steps": 130, "total_steps": 3255, "loss": 0.0823, "lr": 3.987730061349693e-05, "epoch": 0.19957781615812703, "percentage": 3.99, "elapsed_time": "0:25:32", "remaining_time": "10:13:49"} |
|
{"current_steps": 140, "total_steps": 3255, "loss": 0.0574, "lr": 4.2944785276073626e-05, "epoch": 0.21492995586259836, "percentage": 4.3, "elapsed_time": "0:27:00", "remaining_time": "10:00:53"} |
|
{"current_steps": 150, "total_steps": 3255, "loss": 0.0783, "lr": 4.601226993865031e-05, "epoch": 0.23028209556706966, "percentage": 4.61, "elapsed_time": "0:28:29", "remaining_time": "9:49:39"} |
|
{"current_steps": 150, "total_steps": 3255, "eval_loss": 0.06952261179685593, "epoch": 0.23028209556706966, "percentage": 4.61, "elapsed_time": "0:31:34", "remaining_time": "10:53:36"} |
|
{"current_steps": 160, "total_steps": 3255, "loss": 0.0974, "lr": 4.907975460122699e-05, "epoch": 0.24563423527154096, "percentage": 4.92, "elapsed_time": "0:33:06", "remaining_time": "10:40:27"} |
|
{"current_steps": 170, "total_steps": 3255, "loss": 0.0751, "lr": 5.214723926380368e-05, "epoch": 0.2609863749760123, "percentage": 5.22, "elapsed_time": "0:34:35", "remaining_time": "10:27:46"} |
|
{"current_steps": 180, "total_steps": 3255, "loss": 0.0761, "lr": 5.521472392638037e-05, "epoch": 0.2763385146804836, "percentage": 5.53, "elapsed_time": "0:36:04", "remaining_time": "10:16:10"} |
|
{"current_steps": 190, "total_steps": 3255, "loss": 0.0629, "lr": 5.8282208588957056e-05, "epoch": 0.2916906543849549, "percentage": 5.84, "elapsed_time": "0:37:32", "remaining_time": "10:05:44"} |
|
{"current_steps": 200, "total_steps": 3255, "loss": 0.0635, "lr": 6.134969325153375e-05, "epoch": 0.3070427940894262, "percentage": 6.14, "elapsed_time": "0:39:02", "remaining_time": "9:56:15"} |
|
{"current_steps": 200, "total_steps": 3255, "eval_loss": 0.05947184935212135, "epoch": 0.3070427940894262, "percentage": 6.14, "elapsed_time": "0:42:07", "remaining_time": "10:43:23"} |
|
{"current_steps": 210, "total_steps": 3255, "loss": 0.06, "lr": 6.441717791411042e-05, "epoch": 0.3223949337938975, "percentage": 6.45, "elapsed_time": "0:43:39", "remaining_time": "10:32:55"} |
|
{"current_steps": 220, "total_steps": 3255, "loss": 0.0491, "lr": 6.748466257668711e-05, "epoch": 0.33774707349836885, "percentage": 6.76, "elapsed_time": "0:45:07", "remaining_time": "10:22:30"} |
|
{"current_steps": 230, "total_steps": 3255, "loss": 0.0828, "lr": 7.055214723926382e-05, "epoch": 0.35309921320284016, "percentage": 7.07, "elapsed_time": "0:46:36", "remaining_time": "10:12:56"} |
|
{"current_steps": 240, "total_steps": 3255, "loss": 0.0633, "lr": 7.361963190184049e-05, "epoch": 0.36845135290731146, "percentage": 7.37, "elapsed_time": "0:48:05", "remaining_time": "10:04:03"} |
|
{"current_steps": 250, "total_steps": 3255, "loss": 0.075, "lr": 7.668711656441718e-05, "epoch": 0.38380349261178276, "percentage": 7.68, "elapsed_time": "0:49:33", "remaining_time": "9:55:46"} |
|
{"current_steps": 250, "total_steps": 3255, "eval_loss": 0.053019050508737564, "epoch": 0.38380349261178276, "percentage": 7.68, "elapsed_time": "0:52:38", "remaining_time": "10:32:47"} |
|
{"current_steps": 260, "total_steps": 3255, "loss": 0.0613, "lr": 7.975460122699386e-05, "epoch": 0.39915563231625406, "percentage": 7.99, "elapsed_time": "0:54:10", "remaining_time": "10:24:02"} |
|
{"current_steps": 270, "total_steps": 3255, "loss": 0.0652, "lr": 8.282208588957055e-05, "epoch": 0.41450777202072536, "percentage": 8.29, "elapsed_time": "0:55:39", "remaining_time": "10:15:19"} |
|
{"current_steps": 280, "total_steps": 3255, "loss": 0.0692, "lr": 8.588957055214725e-05, "epoch": 0.4298599117251967, "percentage": 8.6, "elapsed_time": "0:57:08", "remaining_time": "10:07:04"} |
|
{"current_steps": 290, "total_steps": 3255, "loss": 0.051, "lr": 8.895705521472393e-05, "epoch": 0.445212051429668, "percentage": 8.91, "elapsed_time": "0:58:37", "remaining_time": "9:59:22"} |
|
{"current_steps": 300, "total_steps": 3255, "loss": 0.065, "lr": 9.202453987730062e-05, "epoch": 0.4605641911341393, "percentage": 9.22, "elapsed_time": "1:00:05", "remaining_time": "9:51:58"} |
|
{"current_steps": 300, "total_steps": 3255, "eval_loss": 0.0490945465862751, "epoch": 0.4605641911341393, "percentage": 9.22, "elapsed_time": "1:03:09", "remaining_time": "10:22:09"} |
|
{"current_steps": 310, "total_steps": 3255, "loss": 0.0461, "lr": 9.50920245398773e-05, "epoch": 0.4759163308386106, "percentage": 9.52, "elapsed_time": "1:04:41", "remaining_time": "10:14:38"} |
|
{"current_steps": 320, "total_steps": 3255, "loss": 0.0471, "lr": 9.815950920245399e-05, "epoch": 0.4912684705430819, "percentage": 9.83, "elapsed_time": "1:06:10", "remaining_time": "10:06:55"} |
|
{"current_steps": 330, "total_steps": 3255, "loss": 0.0541, "lr": 9.999953982785432e-05, "epoch": 0.5066206102475532, "percentage": 10.14, "elapsed_time": "1:07:38", "remaining_time": "9:59:34"} |
|
{"current_steps": 340, "total_steps": 3255, "loss": 0.0474, "lr": 9.999436298849151e-05, "epoch": 0.5219727499520246, "percentage": 10.45, "elapsed_time": "1:09:07", "remaining_time": "9:52:40"} |
|
{"current_steps": 350, "total_steps": 3255, "loss": 0.0474, "lr": 9.998343469212352e-05, "epoch": 0.5373248896564958, "percentage": 10.75, "elapsed_time": "1:10:35", "remaining_time": "9:45:56"} |
|
{"current_steps": 350, "total_steps": 3255, "eval_loss": 0.04777354747056961, "epoch": 0.5373248896564958, "percentage": 10.75, "elapsed_time": "1:13:40", "remaining_time": "10:11:26"} |
|
{"current_steps": 360, "total_steps": 3255, "loss": 0.047, "lr": 9.996675619596465e-05, "epoch": 0.5526770293609672, "percentage": 11.06, "elapsed_time": "1:15:12", "remaining_time": "10:04:47"} |
|
{"current_steps": 370, "total_steps": 3255, "loss": 0.0571, "lr": 9.99443294187443e-05, "epoch": 0.5680291690654385, "percentage": 11.37, "elapsed_time": "1:16:40", "remaining_time": "9:57:54"} |
|
{"current_steps": 380, "total_steps": 3255, "loss": 0.0483, "lr": 9.991615694048621e-05, "epoch": 0.5833813087699098, "percentage": 11.67, "elapsed_time": "1:18:09", "remaining_time": "9:51:19"} |
|
{"current_steps": 390, "total_steps": 3255, "loss": 0.057, "lr": 9.988224200221172e-05, "epoch": 0.5987334484743811, "percentage": 11.98, "elapsed_time": "1:19:37", "remaining_time": "9:44:59"} |
|
{"current_steps": 400, "total_steps": 3255, "loss": 0.0461, "lr": 9.984258850556693e-05, "epoch": 0.6140855881788524, "percentage": 12.29, "elapsed_time": "1:21:06", "remaining_time": "9:38:56"} |
|
{"current_steps": 400, "total_steps": 3255, "eval_loss": 0.04933024197816849, "epoch": 0.6140855881788524, "percentage": 12.29, "elapsed_time": "1:24:11", "remaining_time": "10:00:54"} |
|
{"current_steps": 410, "total_steps": 3255, "loss": 0.0434, "lr": 9.979720101237375e-05, "epoch": 0.6294377278833237, "percentage": 12.6, "elapsed_time": "1:25:43", "remaining_time": "9:54:53"} |
|
{"current_steps": 420, "total_steps": 3255, "loss": 0.0511, "lr": 9.974608474410512e-05, "epoch": 0.644789867587795, "percentage": 12.9, "elapsed_time": "1:27:12", "remaining_time": "9:48:42"} |
|
{"current_steps": 430, "total_steps": 3255, "loss": 0.0506, "lr": 9.968924558128445e-05, "epoch": 0.6601420072922664, "percentage": 13.21, "elapsed_time": "1:28:41", "remaining_time": "9:42:41"} |
|
{"current_steps": 440, "total_steps": 3255, "loss": 0.0421, "lr": 9.962669006280894e-05, "epoch": 0.6754941469967377, "percentage": 13.52, "elapsed_time": "1:30:09", "remaining_time": "9:36:48"} |
|
{"current_steps": 450, "total_steps": 3255, "loss": 0.0533, "lr": 9.95584253851974e-05, "epoch": 0.690846286701209, "percentage": 13.82, "elapsed_time": "1:31:37", "remaining_time": "9:31:10"} |
|
{"current_steps": 450, "total_steps": 3255, "eval_loss": 0.053962595760822296, "epoch": 0.690846286701209, "percentage": 13.82, "elapsed_time": "1:34:42", "remaining_time": "9:50:20"} |
|
{"current_steps": 460, "total_steps": 3255, "loss": 0.0548, "lr": 9.948445940176243e-05, "epoch": 0.7061984264056803, "percentage": 14.13, "elapsed_time": "1:36:17", "remaining_time": "9:45:02"} |
|
{"current_steps": 470, "total_steps": 3255, "loss": 0.0433, "lr": 9.940480062170679e-05, "epoch": 0.7215505661101516, "percentage": 14.44, "elapsed_time": "1:37:45", "remaining_time": "9:39:16"} |
|
{"current_steps": 480, "total_steps": 3255, "loss": 0.0538, "lr": 9.931945820914462e-05, "epoch": 0.7369027058146229, "percentage": 14.75, "elapsed_time": "1:39:13", "remaining_time": "9:33:40"} |
|
{"current_steps": 490, "total_steps": 3255, "loss": 0.0429, "lr": 9.922844198204715e-05, "epoch": 0.7522548455190943, "percentage": 15.05, "elapsed_time": "1:40:42", "remaining_time": "9:28:15"} |
|
{"current_steps": 500, "total_steps": 3255, "loss": 0.048, "lr": 9.913176241111319e-05, "epoch": 0.7676069852235655, "percentage": 15.36, "elapsed_time": "1:42:10", "remaining_time": "9:23:00"} |
|
{"current_steps": 500, "total_steps": 3255, "eval_loss": 0.045701391994953156, "epoch": 0.7676069852235655, "percentage": 15.36, "elapsed_time": "1:45:15", "remaining_time": "9:39:56"} |
|
{"current_steps": 510, "total_steps": 3255, "loss": 0.0381, "lr": 9.902943061856456e-05, "epoch": 0.7829591249280369, "percentage": 15.67, "elapsed_time": "1:46:47", "remaining_time": "9:34:46"} |
|
{"current_steps": 520, "total_steps": 3255, "loss": 0.0628, "lr": 9.892145837686657e-05, "epoch": 0.7983112646325081, "percentage": 15.98, "elapsed_time": "1:48:15", "remaining_time": "9:29:22"} |
|
{"current_steps": 530, "total_steps": 3255, "loss": 0.0577, "lr": 9.880785810737378e-05, "epoch": 0.8136634043369795, "percentage": 16.28, "elapsed_time": "1:49:43", "remaining_time": "9:24:10"} |
|
{"current_steps": 540, "total_steps": 3255, "loss": 0.0442, "lr": 9.868864287890083e-05, "epoch": 0.8290155440414507, "percentage": 16.59, "elapsed_time": "1:51:10", "remaining_time": "9:18:58"} |
|
{"current_steps": 550, "total_steps": 3255, "loss": 0.0694, "lr": 9.856382640621917e-05, "epoch": 0.8443676837459221, "percentage": 16.9, "elapsed_time": "1:52:38", "remaining_time": "9:14:01"} |
|
{"current_steps": 550, "total_steps": 3255, "eval_loss": 0.047504179179668427, "epoch": 0.8443676837459221, "percentage": 16.9, "elapsed_time": "1:55:38", "remaining_time": "9:28:43"} |
|
{"current_steps": 560, "total_steps": 3255, "loss": 0.0381, "lr": 9.84334230484792e-05, "epoch": 0.8597198234503934, "percentage": 17.2, "elapsed_time": "1:57:09", "remaining_time": "9:23:48"} |
|
{"current_steps": 570, "total_steps": 3255, "loss": 0.044, "lr": 9.82974478075583e-05, "epoch": 0.8750719631548647, "percentage": 17.51, "elapsed_time": "1:58:37", "remaining_time": "9:18:44"} |
|
{"current_steps": 580, "total_steps": 3255, "loss": 0.0388, "lr": 9.815591632633509e-05, "epoch": 0.890424102859336, "percentage": 17.82, "elapsed_time": "2:00:04", "remaining_time": "9:13:46"} |
|
{"current_steps": 590, "total_steps": 3255, "loss": 0.044, "lr": 9.800884488688985e-05, "epoch": 0.9057762425638073, "percentage": 18.13, "elapsed_time": "2:01:32", "remaining_time": "9:08:58"} |
|
{"current_steps": 600, "total_steps": 3255, "loss": 0.0396, "lr": 9.785625040863124e-05, "epoch": 0.9211283822682786, "percentage": 18.43, "elapsed_time": "2:02:59", "remaining_time": "9:04:14"} |
|
{"current_steps": 600, "total_steps": 3255, "eval_loss": 0.04156533628702164, "epoch": 0.9211283822682786, "percentage": 18.43, "elapsed_time": "2:06:03", "remaining_time": "9:17:46"} |
|
{"current_steps": 610, "total_steps": 3255, "loss": 0.036, "lr": 9.769815044635005e-05, "epoch": 0.93648052197275, "percentage": 18.74, "elapsed_time": "2:07:34", "remaining_time": "9:13:11"} |
|
{"current_steps": 620, "total_steps": 3255, "loss": 0.0463, "lr": 9.753456318819946e-05, "epoch": 0.9518326616772212, "percentage": 19.05, "elapsed_time": "2:09:02", "remaining_time": "9:08:27"} |
|
{"current_steps": 630, "total_steps": 3255, "loss": 0.0425, "lr": 9.736550745360292e-05, "epoch": 0.9671848013816926, "percentage": 19.35, "elapsed_time": "2:10:30", "remaining_time": "9:03:48"} |
|
{"current_steps": 640, "total_steps": 3255, "loss": 0.043, "lr": 9.719100269108872e-05, "epoch": 0.9825369410861639, "percentage": 19.66, "elapsed_time": "2:11:59", "remaining_time": "8:59:17"} |
|
{"current_steps": 650, "total_steps": 3255, "loss": 0.0412, "lr": 9.701106897605304e-05, "epoch": 0.9978890807906352, "percentage": 19.97, "elapsed_time": "2:13:27", "remaining_time": "8:54:49"} |
|
{"current_steps": 650, "total_steps": 3255, "eval_loss": 0.03858696296811104, "epoch": 0.9978890807906352, "percentage": 19.97, "elapsed_time": "2:16:30", "remaining_time": "9:07:05"} |
|
{"current_steps": 660, "total_steps": 3255, "loss": 0.0308, "lr": 9.682572700845006e-05, "epoch": 1.0132412204951065, "percentage": 20.28, "elapsed_time": "2:18:02", "remaining_time": "9:02:44"} |
|
{"current_steps": 670, "total_steps": 3255, "loss": 0.0335, "lr": 9.663499811041082e-05, "epoch": 1.0285933601995778, "percentage": 20.58, "elapsed_time": "2:19:30", "remaining_time": "8:58:14"} |
|
{"current_steps": 680, "total_steps": 3255, "loss": 0.0363, "lr": 9.643890422379018e-05, "epoch": 1.0439454999040492, "percentage": 20.89, "elapsed_time": "2:20:58", "remaining_time": "8:53:50"} |
|
{"current_steps": 690, "total_steps": 3255, "loss": 0.0306, "lr": 9.623746790764261e-05, "epoch": 1.0592976396085205, "percentage": 21.2, "elapsed_time": "2:22:26", "remaining_time": "8:49:31"} |
|
{"current_steps": 700, "total_steps": 3255, "loss": 0.0339, "lr": 9.603071233562695e-05, "epoch": 1.0746497793129917, "percentage": 21.51, "elapsed_time": "2:23:54", "remaining_time": "8:45:17"} |
|
{"current_steps": 700, "total_steps": 3255, "eval_loss": 0.04569621756672859, "epoch": 1.0746497793129917, "percentage": 21.51, "elapsed_time": "2:26:59", "remaining_time": "8:56:29"} |
|
{"current_steps": 710, "total_steps": 3255, "loss": 0.0407, "lr": 9.581866129334044e-05, "epoch": 1.090001919017463, "percentage": 21.81, "elapsed_time": "2:28:30", "remaining_time": "8:52:21"} |
|
{"current_steps": 720, "total_steps": 3255, "loss": 0.0452, "lr": 9.560133917558242e-05, "epoch": 1.1053540587219344, "percentage": 22.12, "elapsed_time": "2:29:59", "remaining_time": "8:48:05"} |
|
{"current_steps": 730, "total_steps": 3255, "loss": 0.0334, "lr": 9.537877098354786e-05, "epoch": 1.1207061984264057, "percentage": 22.43, "elapsed_time": "2:31:28", "remaining_time": "8:43:54"} |
|
{"current_steps": 740, "total_steps": 3255, "loss": 0.0274, "lr": 9.51509823219512e-05, "epoch": 1.136058338130877, "percentage": 22.73, "elapsed_time": "2:32:56", "remaining_time": "8:39:46"} |
|
{"current_steps": 750, "total_steps": 3255, "loss": 0.0357, "lr": 9.491799939608065e-05, "epoch": 1.1514104778353482, "percentage": 23.04, "elapsed_time": "2:34:24", "remaining_time": "8:35:43"} |
|
{"current_steps": 750, "total_steps": 3255, "eval_loss": 0.04340927302837372, "epoch": 1.1514104778353482, "percentage": 23.04, "elapsed_time": "2:37:28", "remaining_time": "8:45:57"} |
|
{"current_steps": 760, "total_steps": 3255, "loss": 0.0303, "lr": 9.467984900878364e-05, "epoch": 1.1667626175398196, "percentage": 23.35, "elapsed_time": "2:38:59", "remaining_time": "8:41:58"} |
|
{"current_steps": 770, "total_steps": 3255, "loss": 0.0269, "lr": 9.443655855738321e-05, "epoch": 1.182114757244291, "percentage": 23.66, "elapsed_time": "2:40:27", "remaining_time": "8:37:51"} |
|
{"current_steps": 780, "total_steps": 3255, "loss": 0.0367, "lr": 9.41881560305262e-05, "epoch": 1.1974668969487623, "percentage": 23.96, "elapsed_time": "2:41:55", "remaining_time": "8:33:49"} |
|
{"current_steps": 790, "total_steps": 3255, "loss": 0.0384, "lr": 9.393467000496344e-05, "epoch": 1.2128190366532334, "percentage": 24.27, "elapsed_time": "2:43:24", "remaining_time": "8:29:52"} |
|
{"current_steps": 800, "total_steps": 3255, "loss": 0.0336, "lr": 9.367612964226218e-05, "epoch": 1.2281711763577048, "percentage": 24.58, "elapsed_time": "2:44:52", "remaining_time": "8:25:58"} |
|
{"current_steps": 800, "total_steps": 3255, "eval_loss": 0.04084751009941101, "epoch": 1.2281711763577048, "percentage": 24.58, "elapsed_time": "2:47:56", "remaining_time": "8:35:21"} |
|
{"current_steps": 810, "total_steps": 3255, "loss": 0.0262, "lr": 9.341256468545122e-05, "epoch": 1.2435233160621761, "percentage": 24.88, "elapsed_time": "2:49:27", "remaining_time": "8:31:31"} |
|
{"current_steps": 820, "total_steps": 3255, "loss": 0.0292, "lr": 9.314400545559934e-05, "epoch": 1.2588754557666475, "percentage": 25.19, "elapsed_time": "2:50:56", "remaining_time": "8:27:36"} |
|
{"current_steps": 830, "total_steps": 3255, "loss": 0.0352, "lr": 9.287048284832698e-05, "epoch": 1.2742275954711189, "percentage": 25.5, "elapsed_time": "2:52:24", "remaining_time": "8:23:43"} |
|
{"current_steps": 840, "total_steps": 3255, "loss": 0.0328, "lr": 9.2592028330252e-05, "epoch": 1.28957973517559, "percentage": 25.81, "elapsed_time": "2:53:53", "remaining_time": "8:19:56"} |
|
{"current_steps": 850, "total_steps": 3255, "loss": 0.0342, "lr": 9.230867393536972e-05, "epoch": 1.3049318748800613, "percentage": 26.11, "elapsed_time": "2:55:22", "remaining_time": "8:16:11"} |
|
{"current_steps": 850, "total_steps": 3255, "eval_loss": 0.041351333260536194, "epoch": 1.3049318748800613, "percentage": 26.11, "elapsed_time": "2:58:25", "remaining_time": "8:24:50"} |
|
{"current_steps": 860, "total_steps": 3255, "loss": 0.0308, "lr": 9.202045226136757e-05, "epoch": 1.3202840145845327, "percentage": 26.42, "elapsed_time": "2:59:57", "remaining_time": "8:21:10"} |
|
{"current_steps": 870, "total_steps": 3255, "loss": 0.0236, "lr": 9.172739646587509e-05, "epoch": 1.335636154289004, "percentage": 26.73, "elapsed_time": "3:01:26", "remaining_time": "8:17:23"} |
|
{"current_steps": 880, "total_steps": 3255, "loss": 0.0305, "lr": 9.142954026264931e-05, "epoch": 1.3509882939934754, "percentage": 27.04, "elapsed_time": "3:02:54", "remaining_time": "8:13:37"} |
|
{"current_steps": 890, "total_steps": 3255, "loss": 0.0259, "lr": 9.112691791769634e-05, "epoch": 1.3663404336979466, "percentage": 27.34, "elapsed_time": "3:04:21", "remaining_time": "8:09:55"} |
|
{"current_steps": 900, "total_steps": 3255, "loss": 0.0307, "lr": 9.081956424532926e-05, "epoch": 1.381692573402418, "percentage": 27.65, "elapsed_time": "3:05:50", "remaining_time": "8:06:16"} |
|
{"current_steps": 900, "total_steps": 3255, "eval_loss": 0.04069655388593674, "epoch": 1.381692573402418, "percentage": 27.65, "elapsed_time": "3:08:53", "remaining_time": "8:14:15"} |
|
{"current_steps": 910, "total_steps": 3255, "loss": 0.0351, "lr": 9.050751460416305e-05, "epoch": 1.3970447131068893, "percentage": 27.96, "elapsed_time": "3:10:25", "remaining_time": "8:10:41"} |
|
{"current_steps": 920, "total_steps": 3255, "loss": 0.0365, "lr": 9.019080489304685e-05, "epoch": 1.4123968528113606, "percentage": 28.26, "elapsed_time": "3:11:53", "remaining_time": "8:07:01"} |
|
{"current_steps": 930, "total_steps": 3255, "loss": 0.0514, "lr": 8.986947154693408e-05, "epoch": 1.427748992515832, "percentage": 28.57, "elapsed_time": "3:13:21", "remaining_time": "8:03:24"} |
|
{"current_steps": 940, "total_steps": 3255, "loss": 0.0431, "lr": 8.954355153269088e-05, "epoch": 1.4431011322203031, "percentage": 28.88, "elapsed_time": "3:14:49", "remaining_time": "7:59:49"} |
|
{"current_steps": 950, "total_steps": 3255, "loss": 0.0312, "lr": 8.921308234484336e-05, "epoch": 1.4584532719247745, "percentage": 29.19, "elapsed_time": "3:16:17", "remaining_time": "7:56:15"} |
|
{"current_steps": 950, "total_steps": 3255, "eval_loss": 0.0378691703081131, "epoch": 1.4584532719247745, "percentage": 29.19, "elapsed_time": "3:19:20", "remaining_time": "8:03:40"} |
|
{"current_steps": 960, "total_steps": 3255, "loss": 0.0333, "lr": 8.887810200126419e-05, "epoch": 1.4738054116292458, "percentage": 29.49, "elapsed_time": "3:20:52", "remaining_time": "8:00:12"} |
|
{"current_steps": 970, "total_steps": 3255, "loss": 0.0381, "lr": 8.853864903879889e-05, "epoch": 1.4891575513337172, "percentage": 29.8, "elapsed_time": "3:22:20", "remaining_time": "7:56:39"} |
|
{"current_steps": 980, "total_steps": 3255, "loss": 0.0371, "lr": 8.81947625088325e-05, "epoch": 1.5045096910381885, "percentage": 30.11, "elapsed_time": "3:23:48", "remaining_time": "7:53:07"} |
|
{"current_steps": 990, "total_steps": 3255, "loss": 0.0327, "lr": 8.784648197279701e-05, "epoch": 1.5198618307426597, "percentage": 30.41, "elapsed_time": "3:25:16", "remaining_time": "7:49:38"} |
|
{"current_steps": 1000, "total_steps": 3255, "loss": 0.0314, "lr": 8.749384749762015e-05, "epoch": 1.535213970447131, "percentage": 30.72, "elapsed_time": "3:26:44", "remaining_time": "7:46:11"} |
|
{"current_steps": 1000, "total_steps": 3255, "eval_loss": 0.0391918309032917, "epoch": 1.535213970447131, "percentage": 30.72, "elapsed_time": "3:29:47", "remaining_time": "7:53:05"} |
|
{"current_steps": 1010, "total_steps": 3255, "loss": 0.0248, "lr": 8.713689965111602e-05, "epoch": 1.5505661101516024, "percentage": 31.03, "elapsed_time": "3:31:19", "remaining_time": "7:49:43"} |
|
{"current_steps": 1020, "total_steps": 3255, "loss": 0.0385, "lr": 8.677567949731801e-05, "epoch": 1.5659182498560735, "percentage": 31.34, "elapsed_time": "3:32:46", "remaining_time": "7:46:14"} |
|
{"current_steps": 1030, "total_steps": 3255, "loss": 0.0482, "lr": 8.64102285917548e-05, "epoch": 1.581270389560545, "percentage": 31.64, "elapsed_time": "3:34:14", "remaining_time": "7:42:47"} |
|
{"current_steps": 1040, "total_steps": 3255, "loss": 0.0339, "lr": 8.604058897666962e-05, "epoch": 1.5966225292650162, "percentage": 31.95, "elapsed_time": "3:35:42", "remaining_time": "7:39:25"} |
|
{"current_steps": 1050, "total_steps": 3255, "loss": 0.0229, "lr": 8.566680317618377e-05, "epoch": 1.6119746689694876, "percentage": 32.26, "elapsed_time": "3:37:10", "remaining_time": "7:36:03"} |
|
{"current_steps": 1050, "total_steps": 3255, "eval_loss": 0.0367230549454689, "epoch": 1.6119746689694876, "percentage": 32.26, "elapsed_time": "3:40:13", "remaining_time": "7:42:28"} |
|
{"current_steps": 1060, "total_steps": 3255, "loss": 0.0397, "lr": 8.528891419140438e-05, "epoch": 1.627326808673959, "percentage": 32.57, "elapsed_time": "3:41:44", "remaining_time": "7:39:11"} |
|
{"current_steps": 1070, "total_steps": 3255, "loss": 0.0286, "lr": 8.490696549547761e-05, "epoch": 1.64267894837843, "percentage": 32.87, "elapsed_time": "3:43:12", "remaining_time": "7:35:48"} |
|
{"current_steps": 1080, "total_steps": 3255, "loss": 0.0398, "lr": 8.452100102858734e-05, "epoch": 1.6580310880829017, "percentage": 33.18, "elapsed_time": "3:44:39", "remaining_time": "7:32:27"} |
|
{"current_steps": 1090, "total_steps": 3255, "loss": 0.0325, "lr": 8.413106519290023e-05, "epoch": 1.6733832277873728, "percentage": 33.49, "elapsed_time": "3:46:07", "remaining_time": "7:29:08"} |
|
{"current_steps": 1100, "total_steps": 3255, "loss": 0.0337, "lr": 8.373720284745757e-05, "epoch": 1.6887353674918442, "percentage": 33.79, "elapsed_time": "3:47:36", "remaining_time": "7:25:53"} |
|
{"current_steps": 1100, "total_steps": 3255, "eval_loss": 0.03723842650651932, "epoch": 1.6887353674918442, "percentage": 33.79, "elapsed_time": "3:50:39", "remaining_time": "7:31:52"} |
|
{"current_steps": 1110, "total_steps": 3255, "loss": 0.0312, "lr": 8.333945930301459e-05, "epoch": 1.7040875071963155, "percentage": 34.1, "elapsed_time": "3:52:11", "remaining_time": "7:28:40"} |
|
{"current_steps": 1120, "total_steps": 3255, "loss": 0.0314, "lr": 8.293788031682789e-05, "epoch": 1.7194396469007867, "percentage": 34.41, "elapsed_time": "3:53:38", "remaining_time": "7:25:23"} |
|
{"current_steps": 1130, "total_steps": 3255, "loss": 0.0321, "lr": 8.253251208739137e-05, "epoch": 1.7347917866052582, "percentage": 34.72, "elapsed_time": "3:55:07", "remaining_time": "7:22:08"} |
|
{"current_steps": 1140, "total_steps": 3255, "loss": 0.0313, "lr": 8.21234012491215e-05, "epoch": 1.7501439263097294, "percentage": 35.02, "elapsed_time": "3:56:35", "remaining_time": "7:18:55"} |
|
{"current_steps": 1150, "total_steps": 3255, "loss": 0.028, "lr": 8.171059486699224e-05, "epoch": 1.7654960660142007, "percentage": 35.33, "elapsed_time": "3:58:03", "remaining_time": "7:15:45"} |
|
{"current_steps": 1150, "total_steps": 3255, "eval_loss": 0.03788375481963158, "epoch": 1.7654960660142007, "percentage": 35.33, "elapsed_time": "4:01:06", "remaining_time": "7:21:19"} |
|
{"current_steps": 1160, "total_steps": 3255, "loss": 0.0343, "lr": 8.129414043112087e-05, "epoch": 1.780848205718672, "percentage": 35.64, "elapsed_time": "4:02:39", "remaining_time": "7:18:14"} |
|
{"current_steps": 1170, "total_steps": 3255, "loss": 0.0262, "lr": 8.087408585130438e-05, "epoch": 1.7962003454231432, "percentage": 35.94, "elapsed_time": "4:04:07", "remaining_time": "7:15:02"} |
|
{"current_steps": 1180, "total_steps": 3255, "loss": 0.0334, "lr": 8.045047945150796e-05, "epoch": 1.8115524851276148, "percentage": 36.25, "elapsed_time": "4:05:35", "remaining_time": "7:11:51"} |
|
{"current_steps": 1190, "total_steps": 3255, "loss": 0.034, "lr": 8.002336996430561e-05, "epoch": 1.826904624832086, "percentage": 36.56, "elapsed_time": "4:07:03", "remaining_time": "7:08:42"} |
|
{"current_steps": 1200, "total_steps": 3255, "loss": 0.0191, "lr": 7.959280652527394e-05, "epoch": 1.8422567645365573, "percentage": 36.87, "elapsed_time": "4:08:30", "remaining_time": "7:05:34"} |
|
{"current_steps": 1200, "total_steps": 3255, "eval_loss": 0.03879622742533684, "epoch": 1.8422567645365573, "percentage": 36.87, "elapsed_time": "4:11:33", "remaining_time": "7:10:47"} |
|
{"current_steps": 1210, "total_steps": 3255, "loss": 0.036, "lr": 7.915883866733946e-05, "epoch": 1.8576089042410286, "percentage": 37.17, "elapsed_time": "4:13:04", "remaining_time": "7:07:42"} |
|
{"current_steps": 1220, "total_steps": 3255, "loss": 0.031, "lr": 7.872151631508022e-05, "epoch": 1.8729610439454998, "percentage": 37.48, "elapsed_time": "4:14:31", "remaining_time": "7:04:33"} |
|
{"current_steps": 1230, "total_steps": 3255, "loss": 0.033, "lr": 7.828088977898234e-05, "epoch": 1.8883131836499714, "percentage": 37.79, "elapsed_time": "4:15:59", "remaining_time": "7:01:26"} |
|
{"current_steps": 1240, "total_steps": 3255, "loss": 0.0449, "lr": 7.783700974965225e-05, "epoch": 1.9036653233544425, "percentage": 38.1, "elapsed_time": "4:17:27", "remaining_time": "6:58:22"} |
|
{"current_steps": 1250, "total_steps": 3255, "loss": 0.0348, "lr": 7.738992729198511e-05, "epoch": 1.9190174630589139, "percentage": 38.4, "elapsed_time": "4:18:55", "remaining_time": "6:55:18"} |
|
{"current_steps": 1250, "total_steps": 3255, "eval_loss": 0.04106801748275757, "epoch": 1.9190174630589139, "percentage": 38.4, "elapsed_time": "4:21:57", "remaining_time": "7:00:11"} |
|
{"current_steps": 1260, "total_steps": 3255, "loss": 0.0232, "lr": 7.693969383929017e-05, "epoch": 1.9343696027633852, "percentage": 38.71, "elapsed_time": "4:23:29", "remaining_time": "6:57:11"} |
|
{"current_steps": 1270, "total_steps": 3255, "loss": 0.0379, "lr": 7.648636118737385e-05, "epoch": 1.9497217424678563, "percentage": 39.02, "elapsed_time": "4:24:57", "remaining_time": "6:54:08"} |
|
{"current_steps": 1280, "total_steps": 3255, "loss": 0.0288, "lr": 7.602998148858089e-05, "epoch": 1.965073882172328, "percentage": 39.32, "elapsed_time": "4:26:24", "remaining_time": "6:51:04"} |
|
{"current_steps": 1290, "total_steps": 3255, "loss": 0.0315, "lr": 7.557060724579484e-05, "epoch": 1.980426021876799, "percentage": 39.63, "elapsed_time": "4:27:52", "remaining_time": "6:48:03"} |
|
{"current_steps": 1300, "total_steps": 3255, "loss": 0.0469, "lr": 7.51082913063978e-05, "epoch": 1.9957781615812704, "percentage": 39.94, "elapsed_time": "4:29:20", "remaining_time": "6:45:03"} |
|
{"current_steps": 1300, "total_steps": 3255, "eval_loss": 0.03991750255227089, "epoch": 1.9957781615812704, "percentage": 39.94, "elapsed_time": "4:32:23", "remaining_time": "6:49:38"} |
|
{"current_steps": 1310, "total_steps": 3255, "loss": 0.026, "lr": 7.464308685619099e-05, "epoch": 2.0111303012857418, "percentage": 40.25, "elapsed_time": "4:33:54", "remaining_time": "6:46:41"} |
|
{"current_steps": 1320, "total_steps": 3255, "loss": 0.0166, "lr": 7.417504741327587e-05, "epoch": 2.026482440990213, "percentage": 40.55, "elapsed_time": "4:35:22", "remaining_time": "6:43:40"} |
|
{"current_steps": 1330, "total_steps": 3255, "loss": 0.0212, "lr": 7.370422682189755e-05, "epoch": 2.0418345806946845, "percentage": 40.86, "elapsed_time": "4:36:50", "remaining_time": "6:40:41"} |
|
{"current_steps": 1340, "total_steps": 3255, "loss": 0.0163, "lr": 7.323067924625024e-05, "epoch": 2.0571867203991556, "percentage": 41.17, "elapsed_time": "4:38:17", "remaining_time": "6:37:42"} |
|
{"current_steps": 1350, "total_steps": 3255, "loss": 0.0193, "lr": 7.275445916424627e-05, "epoch": 2.0725388601036268, "percentage": 41.47, "elapsed_time": "4:39:45", "remaining_time": "6:34:46"} |
|
{"current_steps": 1350, "total_steps": 3255, "eval_loss": 0.04122938960790634, "epoch": 2.0725388601036268, "percentage": 41.47, "elapsed_time": "4:42:48", "remaining_time": "6:39:03"} |
|
{"current_steps": 1360, "total_steps": 3255, "loss": 0.0151, "lr": 7.227562136124864e-05, "epoch": 2.0878909998080983, "percentage": 41.78, "elapsed_time": "4:44:18", "remaining_time": "6:36:09"} |
|
{"current_steps": 1370, "total_steps": 3255, "loss": 0.0158, "lr": 7.179422092376856e-05, "epoch": 2.1032431395125695, "percentage": 42.09, "elapsed_time": "4:45:46", "remaining_time": "6:33:11"} |
|
{"current_steps": 1380, "total_steps": 3255, "loss": 0.0182, "lr": 7.13103132331281e-05, "epoch": 2.118595279217041, "percentage": 42.4, "elapsed_time": "4:47:13", "remaining_time": "6:30:14"} |
|
{"current_steps": 1390, "total_steps": 3255, "loss": 0.0232, "lr": 7.082395395908903e-05, "epoch": 2.133947418921512, "percentage": 42.7, "elapsed_time": "4:48:41", "remaining_time": "6:27:20"} |
|
{"current_steps": 1400, "total_steps": 3255, "loss": 0.0168, "lr": 7.033519905344846e-05, "epoch": 2.1492995586259833, "percentage": 43.01, "elapsed_time": "4:50:09", "remaining_time": "6:24:27"} |
|
{"current_steps": 1400, "total_steps": 3255, "eval_loss": 0.041591525077819824, "epoch": 2.1492995586259833, "percentage": 43.01, "elapsed_time": "4:53:11", "remaining_time": "6:28:28"} |
|
{"current_steps": 1410, "total_steps": 3255, "loss": 0.021, "lr": 6.984410474360195e-05, "epoch": 2.164651698330455, "percentage": 43.32, "elapsed_time": "4:54:42", "remaining_time": "6:25:37"} |
|
{"current_steps": 1420, "total_steps": 3255, "loss": 0.0253, "lr": 6.935072752607511e-05, "epoch": 2.180003838034926, "percentage": 43.63, "elapsed_time": "4:56:09", "remaining_time": "6:22:43"} |
|
{"current_steps": 1430, "total_steps": 3255, "loss": 0.0262, "lr": 6.885512416002412e-05, "epoch": 2.1953559777393976, "percentage": 43.93, "elapsed_time": "4:57:37", "remaining_time": "6:19:50"} |
|
{"current_steps": 1440, "total_steps": 3255, "loss": 0.0189, "lr": 6.835735166070587e-05, "epoch": 2.2107081174438687, "percentage": 44.24, "elapsed_time": "4:59:04", "remaining_time": "6:16:57"} |
|
{"current_steps": 1450, "total_steps": 3255, "loss": 0.019, "lr": 6.785746729291897e-05, "epoch": 2.22606025714834, "percentage": 44.55, "elapsed_time": "5:00:32", "remaining_time": "6:14:07"} |
|
{"current_steps": 1450, "total_steps": 3255, "eval_loss": 0.03900735080242157, "epoch": 2.22606025714834, "percentage": 44.55, "elapsed_time": "5:03:34", "remaining_time": "6:17:54"} |
|
{"current_steps": 1460, "total_steps": 3255, "loss": 0.0256, "lr": 6.735552856441585e-05, "epoch": 2.2414123968528115, "percentage": 44.85, "elapsed_time": "5:05:05", "remaining_time": "6:15:05"} |
|
{"current_steps": 1470, "total_steps": 3255, "loss": 0.0202, "lr": 6.685159321928691e-05, "epoch": 2.2567645365572826, "percentage": 45.16, "elapsed_time": "5:06:33", "remaining_time": "6:12:14"} |
|
{"current_steps": 1480, "total_steps": 3255, "loss": 0.0216, "lr": 6.634571923131756e-05, "epoch": 2.272116676261754, "percentage": 45.47, "elapsed_time": "5:08:00", "remaining_time": "6:09:24"} |
|
{"current_steps": 1490, "total_steps": 3255, "loss": 0.0197, "lr": 6.583796479731872e-05, "epoch": 2.2874688159662253, "percentage": 45.78, "elapsed_time": "5:09:28", "remaining_time": "6:06:35"} |
|
{"current_steps": 1500, "total_steps": 3255, "loss": 0.0268, "lr": 6.532838833043189e-05, "epoch": 2.3028209556706964, "percentage": 46.08, "elapsed_time": "5:10:56", "remaining_time": "6:03:47"} |
|
{"current_steps": 1500, "total_steps": 3255, "eval_loss": 0.03901956230401993, "epoch": 2.3028209556706964, "percentage": 46.08, "elapsed_time": "5:13:58", "remaining_time": "6:07:20"} |
|
{"current_steps": 1510, "total_steps": 3255, "loss": 0.0241, "lr": 6.481704845340894e-05, "epoch": 2.318173095375168, "percentage": 46.39, "elapsed_time": "5:15:30", "remaining_time": "6:04:36"} |
|
{"current_steps": 1520, "total_steps": 3255, "loss": 0.0212, "lr": 6.43040039918683e-05, "epoch": 2.333525235079639, "percentage": 46.7, "elapsed_time": "5:16:56", "remaining_time": "6:01:46"} |
|
{"current_steps": 1530, "total_steps": 3255, "loss": 0.0188, "lr": 6.37893139675273e-05, "epoch": 2.3488773747841103, "percentage": 47.0, "elapsed_time": "5:18:24", "remaining_time": "5:58:59"} |
|
{"current_steps": 1540, "total_steps": 3255, "loss": 0.0184, "lr": 6.327303759141235e-05, "epoch": 2.364229514488582, "percentage": 47.31, "elapsed_time": "5:19:52", "remaining_time": "5:56:12"} |
|
{"current_steps": 1550, "total_steps": 3255, "loss": 0.0221, "lr": 6.275523425704707e-05, "epoch": 2.379581654193053, "percentage": 47.62, "elapsed_time": "5:21:19", "remaining_time": "5:53:27"} |
|
{"current_steps": 1550, "total_steps": 3255, "eval_loss": 0.0411539301276207, "epoch": 2.379581654193053, "percentage": 47.62, "elapsed_time": "5:24:21", "remaining_time": "5:56:47"} |
|
{"current_steps": 1560, "total_steps": 3255, "loss": 0.0225, "lr": 6.223596353361961e-05, "epoch": 2.3949337938975246, "percentage": 47.93, "elapsed_time": "5:25:52", "remaining_time": "5:54:04"} |
|
{"current_steps": 1570, "total_steps": 3255, "loss": 0.0121, "lr": 6.171528515912965e-05, "epoch": 2.4102859336019957, "percentage": 48.23, "elapsed_time": "5:27:19", "remaining_time": "5:51:18"} |
|
{"current_steps": 1580, "total_steps": 3255, "loss": 0.0191, "lr": 6.119325903351599e-05, "epoch": 2.425638073306467, "percentage": 48.54, "elapsed_time": "5:28:47", "remaining_time": "5:48:33"} |
|
{"current_steps": 1590, "total_steps": 3255, "loss": 0.0256, "lr": 6.0669945211765585e-05, "epoch": 2.4409902130109384, "percentage": 48.85, "elapsed_time": "5:30:15", "remaining_time": "5:45:49"} |
|
{"current_steps": 1600, "total_steps": 3255, "loss": 0.0264, "lr": 6.0145403897004696e-05, "epoch": 2.4563423527154096, "percentage": 49.16, "elapsed_time": "5:31:42", "remaining_time": "5:43:06"} |
|
{"current_steps": 1600, "total_steps": 3255, "eval_loss": 0.0407683365046978, "epoch": 2.4563423527154096, "percentage": 49.16, "elapsed_time": "5:34:45", "remaining_time": "5:46:15"} |
|
{"current_steps": 1610, "total_steps": 3255, "loss": 0.0215, "lr": 5.961969543357292e-05, "epoch": 2.471694492419881, "percentage": 49.46, "elapsed_time": "5:36:16", "remaining_time": "5:43:35"} |
|
{"current_steps": 1620, "total_steps": 3255, "loss": 0.0237, "lr": 5.9092880300081123e-05, "epoch": 2.4870466321243523, "percentage": 49.77, "elapsed_time": "5:37:43", "remaining_time": "5:40:51"} |
|
{"current_steps": 1630, "total_steps": 3255, "loss": 0.0208, "lr": 5.8565019102453844e-05, "epoch": 2.5023987718288234, "percentage": 50.08, "elapsed_time": "5:39:11", "remaining_time": "5:38:08"} |
|
{"current_steps": 1640, "total_steps": 3255, "loss": 0.0211, "lr": 5.8036172566957006e-05, "epoch": 2.517750911533295, "percentage": 50.38, "elapsed_time": "5:40:38", "remaining_time": "5:35:27"} |
|
{"current_steps": 1650, "total_steps": 3255, "loss": 0.0248, "lr": 5.750640153321194e-05, "epoch": 2.533103051237766, "percentage": 50.69, "elapsed_time": "5:42:06", "remaining_time": "5:32:46"} |
|
{"current_steps": 1650, "total_steps": 3255, "eval_loss": 0.03897058963775635, "epoch": 2.533103051237766, "percentage": 50.69, "elapsed_time": "5:45:08", "remaining_time": "5:35:43"} |
|
{"current_steps": 1660, "total_steps": 3255, "loss": 0.0204, "lr": 5.697576694719616e-05, "epoch": 2.5484551909422377, "percentage": 51.0, "elapsed_time": "5:46:40", "remaining_time": "5:33:05"} |
|
{"current_steps": 1670, "total_steps": 3255, "loss": 0.0229, "lr": 5.644432985423206e-05, "epoch": 2.563807330646709, "percentage": 51.31, "elapsed_time": "5:48:06", "remaining_time": "5:30:23"} |
|
{"current_steps": 1680, "total_steps": 3255, "loss": 0.0227, "lr": 5.591215139196414e-05, "epoch": 2.57915947035118, "percentage": 51.61, "elapsed_time": "5:49:34", "remaining_time": "5:27:43"} |
|
{"current_steps": 1690, "total_steps": 3255, "loss": 0.0284, "lr": 5.5379292783325585e-05, "epoch": 2.5945116100556516, "percentage": 51.92, "elapsed_time": "5:51:01", "remaining_time": "5:25:03"} |
|
{"current_steps": 1700, "total_steps": 3255, "loss": 0.018, "lr": 5.4845815329495054e-05, "epoch": 2.6098637497601227, "percentage": 52.23, "elapsed_time": "5:52:29", "remaining_time": "5:22:25"} |
|
{"current_steps": 1700, "total_steps": 3255, "eval_loss": 0.039676472544670105, "epoch": 2.6098637497601227, "percentage": 52.23, "elapsed_time": "5:55:31", "remaining_time": "5:25:12"} |
|
{"current_steps": 1710, "total_steps": 3255, "loss": 0.0213, "lr": 5.431178040284446e-05, "epoch": 2.6252158894645943, "percentage": 52.53, "elapsed_time": "5:57:02", "remaining_time": "5:22:35"} |
|
{"current_steps": 1720, "total_steps": 3255, "loss": 0.0162, "lr": 5.377724943987855e-05, "epoch": 2.6405680291690654, "percentage": 52.84, "elapsed_time": "5:58:29", "remaining_time": "5:19:56"} |
|
{"current_steps": 1730, "total_steps": 3255, "loss": 0.0172, "lr": 5.324228393416718e-05, "epoch": 2.6559201688735365, "percentage": 53.15, "elapsed_time": "5:59:57", "remaining_time": "5:17:18"} |
|
{"current_steps": 1740, "total_steps": 3255, "loss": 0.0229, "lr": 5.270694542927088e-05, "epoch": 2.671272308578008, "percentage": 53.46, "elapsed_time": "6:01:25", "remaining_time": "5:14:41"} |
|
{"current_steps": 1750, "total_steps": 3255, "loss": 0.0148, "lr": 5.21712955116608e-05, "epoch": 2.6866244482824793, "percentage": 53.76, "elapsed_time": "6:02:52", "remaining_time": "5:12:04"} |
|
{"current_steps": 1750, "total_steps": 3255, "eval_loss": 0.04060601443052292, "epoch": 2.6866244482824793, "percentage": 53.76, "elapsed_time": "6:05:55", "remaining_time": "5:14:41"} |
|
{"current_steps": 1760, "total_steps": 3255, "loss": 0.02, "lr": 5.1635395803633666e-05, "epoch": 2.701976587986951, "percentage": 54.07, "elapsed_time": "6:07:27", "remaining_time": "5:12:08"} |
|
{"current_steps": 1770, "total_steps": 3255, "loss": 0.0159, "lr": 5.109930795622265e-05, "epoch": 2.717328727691422, "percentage": 54.38, "elapsed_time": "6:08:56", "remaining_time": "5:09:31"} |
|
{"current_steps": 1780, "total_steps": 3255, "loss": 0.0172, "lr": 5.056309364210483e-05, "epoch": 2.732680867395893, "percentage": 54.69, "elapsed_time": "6:10:24", "remaining_time": "5:06:56"} |
|
{"current_steps": 1790, "total_steps": 3255, "loss": 0.0261, "lr": 5.002681454850632e-05, "epoch": 2.7480330071003647, "percentage": 54.99, "elapsed_time": "6:11:52", "remaining_time": "5:04:21"} |
|
{"current_steps": 1800, "total_steps": 3255, "loss": 0.0228, "lr": 4.949053237010554e-05, "epoch": 2.763385146804836, "percentage": 55.3, "elapsed_time": "6:13:20", "remaining_time": "5:01:47"} |
|
{"current_steps": 1800, "total_steps": 3255, "eval_loss": 0.04158102348446846, "epoch": 2.763385146804836, "percentage": 55.3, "elapsed_time": "6:16:24", "remaining_time": "5:04:16"} |
|
{"current_steps": 1810, "total_steps": 3255, "loss": 0.0146, "lr": 4.89543088019359e-05, "epoch": 2.7787372865093074, "percentage": 55.61, "elapsed_time": "6:17:57", "remaining_time": "5:01:44"} |
|
{"current_steps": 1820, "total_steps": 3255, "loss": 0.0284, "lr": 4.841820553228805e-05, "epoch": 2.7940894262137785, "percentage": 55.91, "elapsed_time": "6:19:26", "remaining_time": "4:59:10"} |
|
{"current_steps": 1830, "total_steps": 3255, "loss": 0.0231, "lr": 4.7882284235613324e-05, "epoch": 2.8094415659182497, "percentage": 56.22, "elapsed_time": "6:20:55", "remaining_time": "4:56:37"} |
|
{"current_steps": 1840, "total_steps": 3255, "loss": 0.0205, "lr": 4.734660656542846e-05, "epoch": 2.8247937056227213, "percentage": 56.53, "elapsed_time": "6:22:24", "remaining_time": "4:54:04"} |
|
{"current_steps": 1850, "total_steps": 3255, "loss": 0.0216, "lr": 4.681123414722291e-05, "epoch": 2.8401458453271924, "percentage": 56.84, "elapsed_time": "6:23:53", "remaining_time": "4:51:33"} |
|
{"current_steps": 1850, "total_steps": 3255, "eval_loss": 0.039232347160577774, "epoch": 2.8401458453271924, "percentage": 56.84, "elapsed_time": "6:26:59", "remaining_time": "4:53:54"} |
|
{"current_steps": 1860, "total_steps": 3255, "loss": 0.0188, "lr": 4.627622857136929e-05, "epoch": 2.855497985031664, "percentage": 57.14, "elapsed_time": "6:28:33", "remaining_time": "4:51:24"} |
|
{"current_steps": 1870, "total_steps": 3255, "loss": 0.0257, "lr": 4.5741651386037883e-05, "epoch": 2.870850124736135, "percentage": 57.45, "elapsed_time": "6:30:02", "remaining_time": "4:48:52"} |
|
{"current_steps": 1880, "total_steps": 3255, "loss": 0.0181, "lr": 4.5207564090116064e-05, "epoch": 2.8862022644406062, "percentage": 57.76, "elapsed_time": "6:31:32", "remaining_time": "4:46:21"} |
|
{"current_steps": 1890, "total_steps": 3255, "loss": 0.0149, "lr": 4.467402812613323e-05, "epoch": 2.901554404145078, "percentage": 58.06, "elapsed_time": "6:33:01", "remaining_time": "4:43:51"} |
|
{"current_steps": 1900, "total_steps": 3255, "loss": 0.021, "lr": 4.414110487319244e-05, "epoch": 2.916906543849549, "percentage": 58.37, "elapsed_time": "6:34:30", "remaining_time": "4:41:21"} |
|
{"current_steps": 1900, "total_steps": 3255, "eval_loss": 0.03955698385834694, "epoch": 2.916906543849549, "percentage": 58.37, "elapsed_time": "6:37:38", "remaining_time": "4:43:34"} |
|
{"current_steps": 1910, "total_steps": 3255, "loss": 0.0214, "lr": 4.360885563990919e-05, "epoch": 2.9322586835540205, "percentage": 58.68, "elapsed_time": "6:39:11", "remaining_time": "4:41:06"} |
|
{"current_steps": 1920, "total_steps": 3255, "loss": 0.0137, "lr": 4.307734165735829e-05, "epoch": 2.9476108232584917, "percentage": 58.99, "elapsed_time": "6:40:41", "remaining_time": "4:38:36"} |
|
{"current_steps": 1930, "total_steps": 3255, "loss": 0.0217, "lr": 4.254662407202976e-05, "epoch": 2.962962962962963, "percentage": 59.29, "elapsed_time": "6:42:11", "remaining_time": "4:36:07"} |
|
{"current_steps": 1940, "total_steps": 3255, "loss": 0.019, "lr": 4.201676393879446e-05, "epoch": 2.9783151026674344, "percentage": 59.6, "elapsed_time": "6:43:42", "remaining_time": "4:33:38"} |
|
{"current_steps": 1950, "total_steps": 3255, "loss": 0.016, "lr": 4.148782221388007e-05, "epoch": 2.9936672423719055, "percentage": 59.91, "elapsed_time": "6:45:12", "remaining_time": "4:31:10"} |
|
{"current_steps": 1950, "total_steps": 3255, "eval_loss": 0.03930049389600754, "epoch": 2.9936672423719055, "percentage": 59.91, "elapsed_time": "6:48:21", "remaining_time": "4:33:17"} |
|
{"current_steps": 1960, "total_steps": 3255, "loss": 0.0102, "lr": 4.0959859747858706e-05, "epoch": 3.009019382076377, "percentage": 60.22, "elapsed_time": "6:49:55", "remaining_time": "4:30:50"} |
|
{"current_steps": 1970, "total_steps": 3255, "loss": 0.0077, "lr": 4.043293727864644e-05, "epoch": 3.0243715217808482, "percentage": 60.52, "elapsed_time": "6:51:26", "remaining_time": "4:28:22"} |
|
{"current_steps": 1980, "total_steps": 3255, "loss": 0.012, "lr": 3.990711542451591e-05, "epoch": 3.0397236614853194, "percentage": 60.83, "elapsed_time": "6:52:56", "remaining_time": "4:25:54"} |
|
{"current_steps": 1990, "total_steps": 3255, "loss": 0.0102, "lr": 3.9382454677122704e-05, "epoch": 3.055075801189791, "percentage": 61.14, "elapsed_time": "6:54:28", "remaining_time": "4:23:28"} |
|
{"current_steps": 2000, "total_steps": 3255, "loss": 0.0055, "lr": 3.885901539454623e-05, "epoch": 3.070427940894262, "percentage": 61.44, "elapsed_time": "6:55:59", "remaining_time": "4:21:02"} |
|
{"current_steps": 2000, "total_steps": 3255, "eval_loss": 0.044558048248291016, "epoch": 3.070427940894262, "percentage": 61.44, "elapsed_time": "6:59:09", "remaining_time": "4:23:01"} |
|
{"current_steps": 2010, "total_steps": 3255, "loss": 0.0119, "lr": 3.833685779434597e-05, "epoch": 3.0857800805987337, "percentage": 61.75, "elapsed_time": "7:00:44", "remaining_time": "4:20:36"} |
|
{"current_steps": 2020, "total_steps": 3255, "loss": 0.0081, "lr": 3.7816041946634024e-05, "epoch": 3.101132220303205, "percentage": 62.06, "elapsed_time": "7:02:15", "remaining_time": "4:18:09"} |
|
{"current_steps": 2030, "total_steps": 3255, "loss": 0.0091, "lr": 3.729662776716439e-05, "epoch": 3.116484360007676, "percentage": 62.37, "elapsed_time": "7:03:47", "remaining_time": "4:15:43"} |
|
{"current_steps": 2040, "total_steps": 3255, "loss": 0.0048, "lr": 3.677867501044029e-05, "epoch": 3.1318364997121475, "percentage": 62.67, "elapsed_time": "7:05:18", "remaining_time": "4:13:18"} |
|
{"current_steps": 2050, "total_steps": 3255, "loss": 0.0128, "lr": 3.6262243262839654e-05, "epoch": 3.1471886394166186, "percentage": 62.98, "elapsed_time": "7:06:49", "remaining_time": "4:10:53"} |
|
{"current_steps": 2050, "total_steps": 3255, "eval_loss": 0.046355538070201874, "epoch": 3.1471886394166186, "percentage": 62.98, "elapsed_time": "7:10:00", "remaining_time": "4:12:45"} |
|
{"current_steps": 2060, "total_steps": 3255, "loss": 0.0075, "lr": 3.574739193576042e-05, "epoch": 3.16254077912109, "percentage": 63.29, "elapsed_time": "7:11:35", "remaining_time": "4:10:21"} |
|
{"current_steps": 2070, "total_steps": 3255, "loss": 0.0072, "lr": 3.5234180258785554e-05, "epoch": 3.1778929188255614, "percentage": 63.59, "elapsed_time": "7:13:07", "remaining_time": "4:07:56"} |
|
{"current_steps": 2080, "total_steps": 3255, "loss": 0.0082, "lr": 3.472266727286928e-05, "epoch": 3.1932450585300325, "percentage": 63.9, "elapsed_time": "7:14:39", "remaining_time": "4:05:32"} |
|
{"current_steps": 2090, "total_steps": 3255, "loss": 0.0077, "lr": 3.4212911823544746e-05, "epoch": 3.208597198234504, "percentage": 64.21, "elapsed_time": "7:16:11", "remaining_time": "4:03:08"} |
|
{"current_steps": 2100, "total_steps": 3255, "loss": 0.0105, "lr": 3.370497255415443e-05, "epoch": 3.223949337938975, "percentage": 64.52, "elapsed_time": "7:17:43", "remaining_time": "4:00:45"} |
|
{"current_steps": 2100, "total_steps": 3255, "eval_loss": 0.046613357961177826, "epoch": 3.223949337938975, "percentage": 64.52, "elapsed_time": "7:20:54", "remaining_time": "4:02:30"} |
|
{"current_steps": 2110, "total_steps": 3255, "loss": 0.0125, "lr": 3.319890789910364e-05, "epoch": 3.239301477643447, "percentage": 64.82, "elapsed_time": "7:22:29", "remaining_time": "4:00:07"} |
|
{"current_steps": 2120, "total_steps": 3255, "loss": 0.0114, "lr": 3.269477607713802e-05, "epoch": 3.254653617347918, "percentage": 65.13, "elapsed_time": "7:24:02", "remaining_time": "3:57:43"} |
|
{"current_steps": 2130, "total_steps": 3255, "loss": 0.0104, "lr": 3.219263508464614e-05, "epoch": 3.270005757052389, "percentage": 65.44, "elapsed_time": "7:25:34", "remaining_time": "3:55:20"} |
|
{"current_steps": 2140, "total_steps": 3255, "loss": 0.0081, "lr": 3.169254268898725e-05, "epoch": 3.2853578967568606, "percentage": 65.75, "elapsed_time": "7:27:07", "remaining_time": "3:52:57"} |
|
{"current_steps": 2150, "total_steps": 3255, "loss": 0.009, "lr": 3.119455642184572e-05, "epoch": 3.3007100364613318, "percentage": 66.05, "elapsed_time": "7:28:39", "remaining_time": "3:50:35"} |
|
{"current_steps": 2150, "total_steps": 3255, "eval_loss": 0.045028459280729294, "epoch": 3.3007100364613318, "percentage": 66.05, "elapsed_time": "7:31:51", "remaining_time": "3:52:14"} |
|
{"current_steps": 2160, "total_steps": 3255, "loss": 0.0089, "lr": 3.069873357261249e-05, "epoch": 3.3160621761658033, "percentage": 66.36, "elapsed_time": "7:33:27", "remaining_time": "3:49:52"} |
|
{"current_steps": 2170, "total_steps": 3255, "loss": 0.0126, "lr": 3.020513118179428e-05, "epoch": 3.3314143158702745, "percentage": 66.67, "elapsed_time": "7:35:00", "remaining_time": "3:47:30"} |
|
{"current_steps": 2180, "total_steps": 3255, "loss": 0.0086, "lr": 2.9713806034451652e-05, "epoch": 3.3467664555747456, "percentage": 66.97, "elapsed_time": "7:36:32", "remaining_time": "3:45:07"} |
|
{"current_steps": 2190, "total_steps": 3255, "loss": 0.0093, "lr": 2.9224814653666242e-05, "epoch": 3.362118595279217, "percentage": 67.28, "elapsed_time": "7:38:05", "remaining_time": "3:42:46"} |
|
{"current_steps": 2200, "total_steps": 3255, "loss": 0.0087, "lr": 2.8738213294038212e-05, "epoch": 3.3774707349836883, "percentage": 67.59, "elapsed_time": "7:39:37", "remaining_time": "3:40:24"} |
|
{"current_steps": 2200, "total_steps": 3255, "eval_loss": 0.04871184378862381, "epoch": 3.3774707349836883, "percentage": 67.59, "elapsed_time": "7:42:50", "remaining_time": "3:41:57"} |
|
{"current_steps": 2210, "total_steps": 3255, "loss": 0.0092, "lr": 2.8254057935214735e-05, "epoch": 3.39282287468816, "percentage": 67.9, "elapsed_time": "7:44:26", "remaining_time": "3:39:36"} |
|
{"current_steps": 2220, "total_steps": 3255, "loss": 0.0099, "lr": 2.7772404275449825e-05, "epoch": 3.408175014392631, "percentage": 68.2, "elapsed_time": "7:45:59", "remaining_time": "3:37:15"} |
|
{"current_steps": 2230, "total_steps": 3255, "loss": 0.0082, "lr": 2.7293307725196793e-05, "epoch": 3.423527154097102, "percentage": 68.51, "elapsed_time": "7:47:32", "remaining_time": "3:34:53"} |
|
{"current_steps": 2240, "total_steps": 3255, "loss": 0.0075, "lr": 2.6816823400733625e-05, "epoch": 3.4388792938015738, "percentage": 68.82, "elapsed_time": "7:49:05", "remaining_time": "3:32:33"} |
|
{"current_steps": 2250, "total_steps": 3255, "loss": 0.0102, "lr": 2.6343006117822437e-05, "epoch": 3.454231433506045, "percentage": 69.12, "elapsed_time": "7:50:38", "remaining_time": "3:30:13"} |
|
{"current_steps": 2250, "total_steps": 3255, "eval_loss": 0.04728643596172333, "epoch": 3.454231433506045, "percentage": 69.12, "elapsed_time": "7:53:52", "remaining_time": "3:31:40"} |
|
{"current_steps": 2260, "total_steps": 3255, "loss": 0.0091, "lr": 2.587191038540317e-05, "epoch": 3.469583573210516, "percentage": 69.43, "elapsed_time": "7:55:28", "remaining_time": "3:29:20"} |
|
{"current_steps": 2270, "total_steps": 3255, "loss": 0.003, "lr": 2.5403590399322886e-05, "epoch": 3.4849357129149876, "percentage": 69.74, "elapsed_time": "7:57:02", "remaining_time": "3:26:59"} |
|
{"current_steps": 2280, "total_steps": 3255, "loss": 0.0088, "lr": 2.493810003610092e-05, "epoch": 3.5002878526194587, "percentage": 70.05, "elapsed_time": "7:58:36", "remaining_time": "3:24:40"} |
|
{"current_steps": 2290, "total_steps": 3255, "loss": 0.012, "lr": 2.4475492846730835e-05, "epoch": 3.51563999232393, "percentage": 70.35, "elapsed_time": "8:00:10", "remaining_time": "3:22:20"} |
|
{"current_steps": 2300, "total_steps": 3255, "loss": 0.007, "lr": 2.4015822050519794e-05, "epoch": 3.5309921320284015, "percentage": 70.66, "elapsed_time": "8:01:44", "remaining_time": "3:20:01"} |
|
{"current_steps": 2300, "total_steps": 3255, "eval_loss": 0.04855369031429291, "epoch": 3.5309921320284015, "percentage": 70.66, "elapsed_time": "8:04:58", "remaining_time": "3:21:22"} |
|
{"current_steps": 2310, "total_steps": 3255, "loss": 0.0051, "lr": 2.3559140528966074e-05, "epoch": 3.546344271732873, "percentage": 70.97, "elapsed_time": "8:06:34", "remaining_time": "3:19:03"} |
|
{"current_steps": 2320, "total_steps": 3255, "loss": 0.0087, "lr": 2.3105500819675495e-05, "epoch": 3.561696411437344, "percentage": 71.27, "elapsed_time": "8:08:09", "remaining_time": "3:16:44"} |
|
{"current_steps": 2330, "total_steps": 3255, "loss": 0.0113, "lr": 2.265495511031742e-05, "epoch": 3.5770485511418153, "percentage": 71.58, "elapsed_time": "8:09:42", "remaining_time": "3:14:24"} |
|
{"current_steps": 2340, "total_steps": 3255, "loss": 0.0101, "lr": 2.2207555232620893e-05, "epoch": 3.5924006908462864, "percentage": 71.89, "elapsed_time": "8:11:17", "remaining_time": "3:12:06"} |
|
{"current_steps": 2350, "total_steps": 3255, "loss": 0.0113, "lr": 2.1763352656411785e-05, "epoch": 3.607752830550758, "percentage": 72.2, "elapsed_time": "8:12:51", "remaining_time": "3:09:48"} |
|
{"current_steps": 2350, "total_steps": 3255, "eval_loss": 0.048977114260196686, "epoch": 3.607752830550758, "percentage": 72.2, "elapsed_time": "8:16:06", "remaining_time": "3:11:03"} |
|
{"current_steps": 2360, "total_steps": 3255, "loss": 0.0045, "lr": 2.1322398483691787e-05, "epoch": 3.6231049702552296, "percentage": 72.5, "elapsed_time": "8:17:43", "remaining_time": "3:08:45"} |
|
{"current_steps": 2370, "total_steps": 3255, "loss": 0.0083, "lr": 2.08847434427593e-05, "epoch": 3.6384571099597007, "percentage": 72.81, "elapsed_time": "8:19:17", "remaining_time": "3:06:26"} |
|
{"current_steps": 2380, "total_steps": 3255, "loss": 0.0065, "lr": 2.0450437882373697e-05, "epoch": 3.653809249664172, "percentage": 73.12, "elapsed_time": "8:20:51", "remaining_time": "3:04:08"} |
|
{"current_steps": 2390, "total_steps": 3255, "loss": 0.0086, "lr": 2.0019531765962995e-05, "epoch": 3.669161389368643, "percentage": 73.43, "elapsed_time": "8:22:24", "remaining_time": "3:01:50"} |
|
{"current_steps": 2400, "total_steps": 3255, "loss": 0.0066, "lr": 1.9592074665876026e-05, "epoch": 3.6845135290731146, "percentage": 73.73, "elapsed_time": "8:23:58", "remaining_time": "2:59:32"} |
|
{"current_steps": 2400, "total_steps": 3255, "eval_loss": 0.05218956619501114, "epoch": 3.6845135290731146, "percentage": 73.73, "elapsed_time": "8:27:14", "remaining_time": "3:00:42"} |
|
{"current_steps": 2410, "total_steps": 3255, "loss": 0.0091, "lr": 1.9168115757679535e-05, "epoch": 3.6998656687775857, "percentage": 74.04, "elapsed_time": "8:28:52", "remaining_time": "2:58:25"} |
|
{"current_steps": 2420, "total_steps": 3255, "loss": 0.0065, "lr": 1.8747703814500866e-05, "epoch": 3.7152178084820573, "percentage": 74.35, "elapsed_time": "8:30:26", "remaining_time": "2:56:07"} |
|
{"current_steps": 2430, "total_steps": 3255, "loss": 0.0058, "lr": 1.833088720141698e-05, "epoch": 3.7305699481865284, "percentage": 74.65, "elapsed_time": "8:32:01", "remaining_time": "2:53:50"} |
|
{"current_steps": 2440, "total_steps": 3255, "loss": 0.0085, "lr": 1.7917713869890557e-05, "epoch": 3.7459220878909996, "percentage": 74.96, "elapsed_time": "8:33:35", "remaining_time": "2:51:32"} |
|
{"current_steps": 2450, "total_steps": 3255, "loss": 0.0064, "lr": 1.7508231352253435e-05, "epoch": 3.761274227595471, "percentage": 75.27, "elapsed_time": "8:35:10", "remaining_time": "2:49:16"} |
|
{"current_steps": 2450, "total_steps": 3255, "eval_loss": 0.05100034922361374, "epoch": 3.761274227595471, "percentage": 75.27, "elapsed_time": "8:38:26", "remaining_time": "2:50:20"} |
|
{"current_steps": 2460, "total_steps": 3255, "loss": 0.007, "lr": 1.7102486756238435e-05, "epoch": 3.7766263672999423, "percentage": 75.58, "elapsed_time": "8:40:03", "remaining_time": "2:48:04"} |
|
{"current_steps": 2470, "total_steps": 3255, "loss": 0.0079, "lr": 1.6700526759560002e-05, "epoch": 3.791978507004414, "percentage": 75.88, "elapsed_time": "8:41:38", "remaining_time": "2:45:46"} |
|
{"current_steps": 2480, "total_steps": 3255, "loss": 0.0106, "lr": 1.6302397604544257e-05, "epoch": 3.807330646708885, "percentage": 76.19, "elapsed_time": "8:43:12", "remaining_time": "2:43:30"} |
|
{"current_steps": 2490, "total_steps": 3255, "loss": 0.0058, "lr": 1.5908145092809272e-05, "epoch": 3.822682786413356, "percentage": 76.5, "elapsed_time": "8:44:47", "remaining_time": "2:41:14"} |
|
{"current_steps": 2500, "total_steps": 3255, "loss": 0.0095, "lr": 1.551781457999586e-05, "epoch": 3.8380349261178277, "percentage": 76.8, "elapsed_time": "8:46:23", "remaining_time": "2:38:58"} |
|
{"current_steps": 2500, "total_steps": 3255, "eval_loss": 0.05139421671628952, "epoch": 3.8380349261178277, "percentage": 76.8, "elapsed_time": "8:49:39", "remaining_time": "2:39:57"} |
|
{"current_steps": 2510, "total_steps": 3255, "loss": 0.0076, "lr": 1.513145097054977e-05, "epoch": 3.853387065822299, "percentage": 77.11, "elapsed_time": "8:51:17", "remaining_time": "2:37:41"} |
|
{"current_steps": 2520, "total_steps": 3255, "loss": 0.0065, "lr": 1.4749098712555854e-05, "epoch": 3.8687392055267704, "percentage": 77.42, "elapsed_time": "8:52:52", "remaining_time": "2:35:25"} |
|
{"current_steps": 2530, "total_steps": 3255, "loss": 0.0043, "lr": 1.4370801792624656e-05, "epoch": 3.8840913452312416, "percentage": 77.73, "elapsed_time": "8:54:27", "remaining_time": "2:33:09"} |
|
{"current_steps": 2540, "total_steps": 3255, "loss": 0.0087, "lr": 1.399660373083203e-05, "epoch": 3.8994434849357127, "percentage": 78.03, "elapsed_time": "8:56:02", "remaining_time": "2:30:53"} |
|
{"current_steps": 2550, "total_steps": 3255, "loss": 0.0089, "lr": 1.3626547575712545e-05, "epoch": 3.9147956246401843, "percentage": 78.34, "elapsed_time": "8:57:38", "remaining_time": "2:28:38"} |
|
{"current_steps": 2550, "total_steps": 3255, "eval_loss": 0.052093155682086945, "epoch": 3.9147956246401843, "percentage": 78.34, "elapsed_time": "9:00:54", "remaining_time": "2:29:32"} |
|
{"current_steps": 2560, "total_steps": 3255, "loss": 0.0124, "lr": 1.3260675899307096e-05, "epoch": 3.9301477643446554, "percentage": 78.65, "elapsed_time": "9:02:32", "remaining_time": "2:27:17"} |
|
{"current_steps": 2570, "total_steps": 3255, "loss": 0.0068, "lr": 1.2899030792265349e-05, "epoch": 3.945499904049127, "percentage": 78.96, "elapsed_time": "9:04:07", "remaining_time": "2:25:01"} |
|
{"current_steps": 2580, "total_steps": 3255, "loss": 0.0096, "lr": 1.2541653859003437e-05, "epoch": 3.960852043753598, "percentage": 79.26, "elapsed_time": "9:05:42", "remaining_time": "2:22:46"} |
|
{"current_steps": 2590, "total_steps": 3255, "loss": 0.0111, "lr": 1.2188586212917846e-05, "epoch": 3.9762041834580693, "percentage": 79.57, "elapsed_time": "9:07:18", "remaining_time": "2:20:31"} |
|
{"current_steps": 2600, "total_steps": 3255, "loss": 0.0065, "lr": 1.1839868471655523e-05, "epoch": 3.991556323162541, "percentage": 79.88, "elapsed_time": "9:08:52", "remaining_time": "2:18:16"} |
|
{"current_steps": 2600, "total_steps": 3255, "eval_loss": 0.05236229673027992, "epoch": 3.991556323162541, "percentage": 79.88, "elapsed_time": "9:12:09", "remaining_time": "2:19:06"} |
|
{"current_steps": 2610, "total_steps": 3255, "loss": 0.0104, "lr": 1.1495540752441235e-05, "epoch": 4.006908462867012, "percentage": 80.18, "elapsed_time": "9:13:47", "remaining_time": "2:16:51"} |
|
{"current_steps": 2620, "total_steps": 3255, "loss": 0.0031, "lr": 1.1155642667462318e-05, "epoch": 4.0222606025714835, "percentage": 80.49, "elapsed_time": "9:15:23", "remaining_time": "2:14:36"} |
|
{"current_steps": 2630, "total_steps": 3255, "loss": 0.0052, "lr": 1.082021331931164e-05, "epoch": 4.037612742275955, "percentage": 80.8, "elapsed_time": "9:16:58", "remaining_time": "2:12:21"} |
|
{"current_steps": 2640, "total_steps": 3255, "loss": 0.0037, "lr": 1.0489291296489152e-05, "epoch": 4.052964881980426, "percentage": 81.11, "elapsed_time": "9:18:32", "remaining_time": "2:10:06"} |
|
{"current_steps": 2650, "total_steps": 3255, "loss": 0.0034, "lr": 1.0162914668962631e-05, "epoch": 4.068317021684897, "percentage": 81.41, "elapsed_time": "9:20:07", "remaining_time": "2:07:52"} |
|
{"current_steps": 2650, "total_steps": 3255, "eval_loss": 0.053961481899023056, "epoch": 4.068317021684897, "percentage": 81.41, "elapsed_time": "9:23:25", "remaining_time": "2:08:37"} |
|
{"current_steps": 2660, "total_steps": 3255, "loss": 0.0036, "lr": 9.841120983787915e-06, "epoch": 4.083669161389369, "percentage": 81.72, "elapsed_time": "9:25:03", "remaining_time": "2:06:23"} |
|
{"current_steps": 2670, "total_steps": 3255, "loss": 0.0024, "lr": 9.523947260789546e-06, "epoch": 4.09902130109384, "percentage": 82.03, "elapsed_time": "9:26:38", "remaining_time": "2:04:09"} |
|
{"current_steps": 2680, "total_steps": 3255, "loss": 0.0029, "lr": 9.211429988301823e-06, "epoch": 4.114373440798311, "percentage": 82.33, "elapsed_time": "9:28:13", "remaining_time": "2:01:54"} |
|
{"current_steps": 2690, "total_steps": 3255, "loss": 0.0049, "lr": 8.90360511897121e-06, "epoch": 4.129725580502782, "percentage": 82.64, "elapsed_time": "9:29:49", "remaining_time": "1:59:41"} |
|
{"current_steps": 2700, "total_steps": 3255, "loss": 0.0032, "lr": 8.600508065620161e-06, "epoch": 4.1450777202072535, "percentage": 82.95, "elapsed_time": "9:31:25", "remaining_time": "1:57:27"} |
|
{"current_steps": 2700, "total_steps": 3255, "eval_loss": 0.05632999911904335, "epoch": 4.1450777202072535, "percentage": 82.95, "elapsed_time": "9:34:42", "remaining_time": "1:58:08"} |
|
{"current_steps": 2710, "total_steps": 3255, "loss": 0.0032, "lr": 8.302173697173226e-06, "epoch": 4.1604298599117255, "percentage": 83.26, "elapsed_time": "9:36:20", "remaining_time": "1:55:54"} |
|
{"current_steps": 2720, "total_steps": 3255, "loss": 0.0038, "lr": 8.008636334645631e-06, "epoch": 4.175781999616197, "percentage": 83.56, "elapsed_time": "9:37:56", "remaining_time": "1:53:40"} |
|
{"current_steps": 2730, "total_steps": 3255, "loss": 0.0035, "lr": 7.71992974719491e-06, "epoch": 4.191134139320668, "percentage": 83.87, "elapsed_time": "9:39:32", "remaining_time": "1:51:27"} |
|
{"current_steps": 2740, "total_steps": 3255, "loss": 0.0018, "lr": 7.436087148236054e-06, "epoch": 4.206486279025139, "percentage": 84.18, "elapsed_time": "9:41:08", "remaining_time": "1:49:13"} |
|
{"current_steps": 2750, "total_steps": 3255, "loss": 0.0026, "lr": 7.157141191620548e-06, "epoch": 4.22183841872961, "percentage": 84.49, "elapsed_time": "9:42:44", "remaining_time": "1:47:00"} |
|
{"current_steps": 2750, "total_steps": 3255, "eval_loss": 0.05644020810723305, "epoch": 4.22183841872961, "percentage": 84.49, "elapsed_time": "9:46:01", "remaining_time": "1:47:36"} |
|
{"current_steps": 2760, "total_steps": 3255, "loss": 0.002, "lr": 6.883123967879796e-06, "epoch": 4.237190558434082, "percentage": 84.79, "elapsed_time": "9:47:39", "remaining_time": "1:45:23"} |
|
{"current_steps": 2770, "total_steps": 3255, "loss": 0.0011, "lr": 6.6140670005334136e-06, "epoch": 4.252542698138553, "percentage": 85.1, "elapsed_time": "9:49:15", "remaining_time": "1:43:10"} |
|
{"current_steps": 2780, "total_steps": 3255, "loss": 0.0024, "lr": 6.350001242462617e-06, "epoch": 4.267894837843024, "percentage": 85.41, "elapsed_time": "9:50:50", "remaining_time": "1:40:57"} |
|
{"current_steps": 2790, "total_steps": 3255, "loss": 0.0033, "lr": 6.090957072349385e-06, "epoch": 4.2832469775474955, "percentage": 85.71, "elapsed_time": "9:52:26", "remaining_time": "1:38:44"} |
|
{"current_steps": 2800, "total_steps": 3255, "loss": 0.0024, "lr": 5.836964291181624e-06, "epoch": 4.298599117251967, "percentage": 86.02, "elapsed_time": "9:54:01", "remaining_time": "1:36:31"} |
|
{"current_steps": 2800, "total_steps": 3255, "eval_loss": 0.058551765978336334, "epoch": 4.298599117251967, "percentage": 86.02, "elapsed_time": "9:57:19", "remaining_time": "1:37:03"} |
|
{"current_steps": 2810, "total_steps": 3255, "loss": 0.0019, "lr": 5.588052118824804e-06, "epoch": 4.313951256956439, "percentage": 86.33, "elapsed_time": "9:58:58", "remaining_time": "1:34:51"} |
|
{"current_steps": 2820, "total_steps": 3255, "loss": 0.0014, "lr": 5.344249190660428e-06, "epoch": 4.32930339666091, "percentage": 86.64, "elapsed_time": "10:00:34", "remaining_time": "1:32:38"} |
|
{"current_steps": 2830, "total_steps": 3255, "loss": 0.0023, "lr": 5.105583554291765e-06, "epoch": 4.344655536365381, "percentage": 86.94, "elapsed_time": "10:02:10", "remaining_time": "1:30:25"} |
|
{"current_steps": 2840, "total_steps": 3255, "loss": 0.0012, "lr": 4.872082666317207e-06, "epoch": 4.360007676069852, "percentage": 87.25, "elapsed_time": "10:03:45", "remaining_time": "1:28:13"} |
|
{"current_steps": 2850, "total_steps": 3255, "loss": 0.0021, "lr": 4.6437733891715905e-06, "epoch": 4.375359815774323, "percentage": 87.56, "elapsed_time": "10:05:21", "remaining_time": "1:26:01"} |
|
{"current_steps": 2850, "total_steps": 3255, "eval_loss": 0.059518758207559586, "epoch": 4.375359815774323, "percentage": 87.56, "elapsed_time": "10:08:39", "remaining_time": "1:26:29"} |
|
{"current_steps": 2860, "total_steps": 3255, "loss": 0.0016, "lr": 4.420681988035891e-06, "epoch": 4.390711955478795, "percentage": 87.86, "elapsed_time": "10:10:19", "remaining_time": "1:24:17"} |
|
{"current_steps": 2870, "total_steps": 3255, "loss": 0.0044, "lr": 4.2028341278156026e-06, "epoch": 4.406064095183266, "percentage": 88.17, "elapsed_time": "10:11:55", "remaining_time": "1:22:05"} |
|
{"current_steps": 2880, "total_steps": 3255, "loss": 0.0033, "lr": 3.990254870188221e-06, "epoch": 4.4214162348877375, "percentage": 88.48, "elapsed_time": "10:13:30", "remaining_time": "1:19:53"} |
|
{"current_steps": 2890, "total_steps": 3255, "loss": 0.0035, "lr": 3.7829686707200827e-06, "epoch": 4.436768374592209, "percentage": 88.79, "elapsed_time": "10:15:06", "remaining_time": "1:17:41"} |
|
{"current_steps": 2900, "total_steps": 3255, "loss": 0.0043, "lr": 3.580999376052946e-06, "epoch": 4.45212051429668, "percentage": 89.09, "elapsed_time": "10:16:43", "remaining_time": "1:15:29"} |
|
{"current_steps": 2900, "total_steps": 3255, "eval_loss": 0.06037411838769913, "epoch": 4.45212051429668, "percentage": 89.09, "elapsed_time": "10:20:01", "remaining_time": "1:15:54"} |
|
{"current_steps": 2910, "total_steps": 3255, "loss": 0.0024, "lr": 3.3843702211606153e-06, "epoch": 4.467472654001152, "percentage": 89.4, "elapsed_time": "10:21:40", "remaining_time": "1:13:42"} |
|
{"current_steps": 2920, "total_steps": 3255, "loss": 0.0055, "lr": 3.193103826675947e-06, "epoch": 4.482824793705623, "percentage": 89.71, "elapsed_time": "10:23:16", "remaining_time": "1:11:30"} |
|
{"current_steps": 2930, "total_steps": 3255, "loss": 0.0018, "lr": 3.007222196288545e-06, "epoch": 4.498176933410094, "percentage": 90.02, "elapsed_time": "10:24:54", "remaining_time": "1:09:18"} |
|
{"current_steps": 2940, "total_steps": 3255, "loss": 0.0014, "lr": 2.8267467142133687e-06, "epoch": 4.513529073114565, "percentage": 90.32, "elapsed_time": "10:26:30", "remaining_time": "1:07:07"} |
|
{"current_steps": 2950, "total_steps": 3255, "loss": 0.0019, "lr": 2.651698142730674e-06, "epoch": 4.528881212819036, "percentage": 90.63, "elapsed_time": "10:28:07", "remaining_time": "1:04:56"} |
|
{"current_steps": 2950, "total_steps": 3255, "eval_loss": 0.06066432595252991, "epoch": 4.528881212819036, "percentage": 90.63, "elapsed_time": "10:31:26", "remaining_time": "1:05:17"} |
|
{"current_steps": 2960, "total_steps": 3255, "loss": 0.0038, "lr": 2.4820966197974748e-06, "epoch": 4.544233352523508, "percentage": 90.94, "elapsed_time": "10:33:05", "remaining_time": "1:03:05"} |
|
{"current_steps": 2970, "total_steps": 3255, "loss": 0.0017, "lr": 2.3179616567308216e-06, "epoch": 4.5595854922279795, "percentage": 91.24, "elapsed_time": "10:34:41", "remaining_time": "1:00:54"} |
|
{"current_steps": 2980, "total_steps": 3255, "loss": 0.0023, "lr": 2.1593121359631873e-06, "epoch": 4.574937631932451, "percentage": 91.55, "elapsed_time": "10:36:17", "remaining_time": "0:58:43"} |
|
{"current_steps": 2990, "total_steps": 3255, "loss": 0.0017, "lr": 2.006166308870189e-06, "epoch": 4.590289771636922, "percentage": 91.86, "elapsed_time": "10:37:54", "remaining_time": "0:56:32"} |
|
{"current_steps": 3000, "total_steps": 3255, "loss": 0.0011, "lr": 1.8585417936709038e-06, "epoch": 4.605641911341393, "percentage": 92.17, "elapsed_time": "10:39:31", "remaining_time": "0:54:21"} |
|
{"current_steps": 3000, "total_steps": 3255, "eval_loss": 0.06103256344795227, "epoch": 4.605641911341393, "percentage": 92.17, "elapsed_time": "10:42:50", "remaining_time": "0:54:38"} |
|
{"current_steps": 3010, "total_steps": 3255, "loss": 0.0035, "lr": 1.7164555734010545e-06, "epoch": 4.620994051045864, "percentage": 92.47, "elapsed_time": "10:44:30", "remaining_time": "0:52:27"} |
|
{"current_steps": 3020, "total_steps": 3255, "loss": 0.0032, "lr": 1.5799239939592204e-06, "epoch": 4.636346190750336, "percentage": 92.78, "elapsed_time": "10:46:07", "remaining_time": "0:50:16"} |
|
{"current_steps": 3030, "total_steps": 3255, "loss": 0.0018, "lr": 1.4489627622263747e-06, "epoch": 4.651698330454807, "percentage": 93.09, "elapsed_time": "10:47:43", "remaining_time": "0:48:05"} |
|
{"current_steps": 3040, "total_steps": 3255, "loss": 0.0079, "lr": 1.3235869442589255e-06, "epoch": 4.667050470159278, "percentage": 93.39, "elapsed_time": "10:49:20", "remaining_time": "0:45:55"} |
|
{"current_steps": 3050, "total_steps": 3255, "loss": 0.0018, "lr": 1.2038109635555406e-06, "epoch": 4.6824026098637495, "percentage": 93.7, "elapsed_time": "10:50:56", "remaining_time": "0:43:45"} |
|
{"current_steps": 3050, "total_steps": 3255, "eval_loss": 0.061669450253248215, "epoch": 4.6824026098637495, "percentage": 93.7, "elapsed_time": "10:54:15", "remaining_time": "0:43:58"} |
|
{"current_steps": 3060, "total_steps": 3255, "loss": 0.0043, "lr": 1.0896485993977467e-06, "epoch": 4.697754749568221, "percentage": 94.01, "elapsed_time": "10:55:55", "remaining_time": "0:41:47"} |
|
{"current_steps": 3070, "total_steps": 3255, "loss": 0.0024, "lr": 9.811129852647982e-07, "epoch": 4.713106889272693, "percentage": 94.32, "elapsed_time": "10:57:32", "remaining_time": "0:39:37"} |
|
{"current_steps": 3080, "total_steps": 3255, "loss": 0.0043, "lr": 8.782166073227515e-07, "epoch": 4.728459028977164, "percentage": 94.62, "elapsed_time": "10:59:08", "remaining_time": "0:37:27"} |
|
{"current_steps": 3090, "total_steps": 3255, "loss": 0.0023, "lr": 7.809713029880428e-07, "epoch": 4.743811168681635, "percentage": 94.93, "elapsed_time": "11:00:45", "remaining_time": "0:35:16"} |
|
{"current_steps": 3100, "total_steps": 3255, "loss": 0.0051, "lr": 6.893882595656598e-07, "epoch": 4.759163308386106, "percentage": 95.24, "elapsed_time": "11:02:21", "remaining_time": "0:33:07"} |
|
{"current_steps": 3100, "total_steps": 3255, "eval_loss": 0.061440397053956985, "epoch": 4.759163308386106, "percentage": 95.24, "elapsed_time": "11:05:40", "remaining_time": "0:33:17"} |
|
{"current_steps": 3110, "total_steps": 3255, "loss": 0.005, "lr": 6.034780129621664e-07, "epoch": 4.774515448090577, "percentage": 95.55, "elapsed_time": "11:07:20", "remaining_time": "0:31:06"} |
|
{"current_steps": 3120, "total_steps": 3255, "loss": 0.0018, "lr": 5.232504464735833e-07, "epoch": 4.789867587795049, "percentage": 95.85, "elapsed_time": "11:08:56", "remaining_time": "0:28:56"} |
|
{"current_steps": 3130, "total_steps": 3255, "loss": 0.0027, "lr": 4.487147896484523e-07, "epoch": 4.80521972749952, "percentage": 96.16, "elapsed_time": "11:10:33", "remaining_time": "0:26:46"} |
|
{"current_steps": 3140, "total_steps": 3255, "loss": 0.0063, "lr": 3.7987961722599773e-07, "epoch": 4.8205718672039914, "percentage": 96.47, "elapsed_time": "11:12:10", "remaining_time": "0:24:37"} |
|
{"current_steps": 3150, "total_steps": 3255, "loss": 0.0032, "lr": 3.167528481496984e-07, "epoch": 4.835924006908463, "percentage": 96.77, "elapsed_time": "11:13:47", "remaining_time": "0:22:27"} |
|
{"current_steps": 3150, "total_steps": 3255, "eval_loss": 0.061653103679418564, "epoch": 4.835924006908463, "percentage": 96.77, "elapsed_time": "11:17:07", "remaining_time": "0:22:34"} |
|
{"current_steps": 3160, "total_steps": 3255, "loss": 0.0056, "lr": 2.593417446562607e-07, "epoch": 4.851276146612934, "percentage": 97.08, "elapsed_time": "11:18:46", "remaining_time": "0:20:24"} |
|
{"current_steps": 3170, "total_steps": 3255, "loss": 0.0011, "lr": 2.0765291144016486e-07, "epoch": 4.866628286317406, "percentage": 97.39, "elapsed_time": "11:20:23", "remaining_time": "0:18:14"} |
|
{"current_steps": 3180, "total_steps": 3255, "loss": 0.0031, "lr": 1.6169229489385595e-07, "epoch": 4.881980426021877, "percentage": 97.7, "elapsed_time": "11:22:00", "remaining_time": "0:16:05"} |
|
{"current_steps": 3190, "total_steps": 3255, "loss": 0.0019, "lr": 1.2146518242363014e-07, "epoch": 4.897332565726348, "percentage": 98.0, "elapsed_time": "11:23:37", "remaining_time": "0:13:55"} |
|
{"current_steps": 3200, "total_steps": 3255, "loss": 0.001, "lr": 8.697620184138222e-08, "epoch": 4.912684705430819, "percentage": 98.31, "elapsed_time": "11:25:14", "remaining_time": "0:11:46"} |
|
{"current_steps": 3200, "total_steps": 3255, "eval_loss": 0.06173569709062576, "epoch": 4.912684705430819, "percentage": 98.31, "elapsed_time": "11:28:32", "remaining_time": "0:11:50"} |
|
{"current_steps": 3210, "total_steps": 3255, "loss": 0.0029, "lr": 5.822932083221488e-08, "epoch": 4.92803684513529, "percentage": 98.62, "elapsed_time": "11:30:13", "remaining_time": "0:09:40"} |
|
{"current_steps": 3220, "total_steps": 3255, "loss": 0.002, "lr": 3.5227846497970504e-08, "epoch": 4.943388984839762, "percentage": 98.92, "elapsed_time": "11:31:51", "remaining_time": "0:07:31"} |
|
{"current_steps": 3230, "total_steps": 3255, "loss": 0.0016, "lr": 1.7974424976796577e-08, "epoch": 4.958741124544233, "percentage": 99.23, "elapsed_time": "11:33:28", "remaining_time": "0:05:22"} |
|
{"current_steps": 3240, "total_steps": 3255, "loss": 0.0035, "lr": 6.47104113870034e-09, "epoch": 4.974093264248705, "percentage": 99.54, "elapsed_time": "11:35:06", "remaining_time": "0:03:13"} |
|
{"current_steps": 3250, "total_steps": 3255, "loss": 0.0029, "lr": 7.190183572314269e-10, "epoch": 4.989445403953176, "percentage": 99.85, "elapsed_time": "11:36:43", "remaining_time": "0:01:04"} |
|
{"current_steps": 3250, "total_steps": 3255, "eval_loss": 0.06179765984416008, "epoch": 4.989445403953176, "percentage": 99.85, "elapsed_time": "11:40:03", "remaining_time": "0:01:04"} |
|
{"current_steps": 3255, "total_steps": 3255, "epoch": 4.997121473805412, "percentage": 100.0, "elapsed_time": "11:40:59", "remaining_time": "0:00:00"} |
|
|