{"current_steps": 10, "total_steps": 1092, "loss": 1.3621, "lr": 1.8181818181818182e-05, "epoch": 0.027472527472527472, "percentage": 0.92, "elapsed_time": "0:01:40", "remaining_time": "3:02:05"} {"current_steps": 20, "total_steps": 1092, "loss": 1.2798, "lr": 3.6363636363636364e-05, "epoch": 0.054945054945054944, "percentage": 1.83, "elapsed_time": "0:03:18", "remaining_time": "2:57:26"} {"current_steps": 25, "total_steps": 1092, "eval_loss": 1.2023646831512451, "epoch": 0.06868131868131869, "percentage": 2.29, "elapsed_time": "0:06:39", "remaining_time": "4:43:54"} {"current_steps": 30, "total_steps": 1092, "loss": 1.164, "lr": 5.4545454545454546e-05, "epoch": 0.08241758241758242, "percentage": 2.75, "elapsed_time": "0:07:30", "remaining_time": "4:25:39"} {"current_steps": 40, "total_steps": 1092, "loss": 1.1436, "lr": 7.272727272727273e-05, "epoch": 0.10989010989010989, "percentage": 3.66, "elapsed_time": "0:09:11", "remaining_time": "4:01:53"} {"current_steps": 50, "total_steps": 1092, "loss": 1.1131, "lr": 9.090909090909092e-05, "epoch": 0.13736263736263737, "percentage": 4.58, "elapsed_time": "0:10:49", "remaining_time": "3:45:41"} {"current_steps": 50, "total_steps": 1092, "eval_loss": 1.1125513315200806, "epoch": 0.13736263736263737, "percentage": 4.58, "elapsed_time": "0:13:22", "remaining_time": "4:38:52"} {"current_steps": 60, "total_steps": 1092, "loss": 1.1114, "lr": 0.00010909090909090909, "epoch": 0.16483516483516483, "percentage": 5.49, "elapsed_time": "0:15:00", "remaining_time": "4:18:16"} {"current_steps": 70, "total_steps": 1092, "loss": 1.0756, "lr": 0.00012727272727272728, "epoch": 0.19230769230769232, "percentage": 6.41, "elapsed_time": "0:16:41", "remaining_time": "4:03:46"} {"current_steps": 75, "total_steps": 1092, "eval_loss": 1.0798790454864502, "epoch": 0.20604395604395603, "percentage": 6.87, "elapsed_time": "0:20:05", "remaining_time": "4:32:26"} {"current_steps": 80, "total_steps": 1092, "loss": 1.072, "lr": 0.00014545454545454546, "epoch": 0.21978021978021978, "percentage": 7.33, "elapsed_time": "0:20:55", "remaining_time": "4:24:44"} {"current_steps": 90, "total_steps": 1092, "loss": 1.0546, "lr": 0.00016363636363636366, "epoch": 0.24725274725274726, "percentage": 8.24, "elapsed_time": "0:22:31", "remaining_time": "4:10:46"} {"current_steps": 100, "total_steps": 1092, "loss": 1.0443, "lr": 0.00018181818181818183, "epoch": 0.27472527472527475, "percentage": 9.16, "elapsed_time": "0:24:13", "remaining_time": "4:00:16"} {"current_steps": 100, "total_steps": 1092, "eval_loss": 1.0595930814743042, "epoch": 0.27472527472527475, "percentage": 9.16, "elapsed_time": "0:26:46", "remaining_time": "4:25:35"} {"current_steps": 110, "total_steps": 1092, "loss": 1.0549, "lr": 0.0002, "epoch": 0.3021978021978022, "percentage": 10.07, "elapsed_time": "0:28:27", "remaining_time": "4:14:01"} {"current_steps": 120, "total_steps": 1092, "loss": 1.0515, "lr": 0.00019994883066969053, "epoch": 0.32967032967032966, "percentage": 10.99, "elapsed_time": "0:30:05", "remaining_time": "4:03:41"} {"current_steps": 125, "total_steps": 1092, "eval_loss": 1.045371174812317, "epoch": 0.3434065934065934, "percentage": 11.45, "elapsed_time": "0:33:28", "remaining_time": "4:18:55"} {"current_steps": 130, "total_steps": 1092, "loss": 1.0425, "lr": 0.00019979537504476944, "epoch": 0.35714285714285715, "percentage": 11.9, "elapsed_time": "0:34:17", "remaining_time": "4:13:44"} {"current_steps": 140, "total_steps": 1092, "loss": 1.028, "lr": 0.00019953979016966788, "epoch": 0.38461538461538464, "percentage": 12.82, "elapsed_time": "0:35:55", "remaining_time": "4:04:19"} {"current_steps": 150, "total_steps": 1092, "loss": 1.0212, "lr": 0.0001991823376065238, "epoch": 0.41208791208791207, "percentage": 13.74, "elapsed_time": "0:37:39", "remaining_time": "3:56:30"} {"current_steps": 150, "total_steps": 1092, "eval_loss": 1.0323785543441772, "epoch": 0.41208791208791207, "percentage": 13.74, "elapsed_time": "0:40:12", "remaining_time": "4:12:31"} {"current_steps": 160, "total_steps": 1092, "loss": 1.0146, "lr": 0.00019872338316750265, "epoch": 0.43956043956043955, "percentage": 14.65, "elapsed_time": "0:41:52", "remaining_time": "4:03:52"} {"current_steps": 170, "total_steps": 1092, "loss": 1.0213, "lr": 0.00019816339654043022, "epoch": 0.46703296703296704, "percentage": 15.57, "elapsed_time": "0:43:29", "remaining_time": "3:55:51"} {"current_steps": 175, "total_steps": 1092, "eval_loss": 1.021622896194458, "epoch": 0.4807692307692308, "percentage": 16.03, "elapsed_time": "0:46:50", "remaining_time": "4:05:28"} {"current_steps": 180, "total_steps": 1092, "loss": 1.0352, "lr": 0.00019750295080812023, "epoch": 0.4945054945054945, "percentage": 16.48, "elapsed_time": "0:47:40", "remaining_time": "4:01:32"} {"current_steps": 190, "total_steps": 1092, "loss": 1.0003, "lr": 0.0001967427218618893, "epoch": 0.521978021978022, "percentage": 17.4, "elapsed_time": "0:49:19", "remaining_time": "3:54:08"} {"current_steps": 200, "total_steps": 1092, "loss": 1.0152, "lr": 0.0001958834877098586, "epoch": 0.5494505494505495, "percentage": 18.32, "elapsed_time": "0:50:59", "remaining_time": "3:47:27"} {"current_steps": 200, "total_steps": 1092, "eval_loss": 1.0108906030654907, "epoch": 0.5494505494505495, "percentage": 18.32, "elapsed_time": "0:53:32", "remaining_time": "3:58:49"} {"current_steps": 210, "total_steps": 1092, "loss": 1.0242, "lr": 0.00019492612768075092, "epoch": 0.5769230769230769, "percentage": 19.23, "elapsed_time": "0:55:08", "remaining_time": "3:51:36"} {"current_steps": 220, "total_steps": 1092, "loss": 1.0221, "lr": 0.0001938716215239974, "epoch": 0.6043956043956044, "percentage": 20.15, "elapsed_time": "0:56:44", "remaining_time": "3:44:54"} {"current_steps": 225, "total_steps": 1092, "eval_loss": 1.001078724861145, "epoch": 0.6181318681318682, "percentage": 20.6, "elapsed_time": "1:00:07", "remaining_time": "3:51:41"} {"current_steps": 230, "total_steps": 1092, "loss": 1.0029, "lr": 0.00019272104840707487, "epoch": 0.6318681318681318, "percentage": 21.06, "elapsed_time": "1:00:54", "remaining_time": "3:48:15"} {"current_steps": 240, "total_steps": 1092, "loss": 0.9949, "lr": 0.00019147558581110078, "epoch": 0.6593406593406593, "percentage": 21.98, "elapsed_time": "1:02:29", "remaining_time": "3:41:49"} {"current_steps": 250, "total_steps": 1092, "loss": 1.0017, "lr": 0.00019013650832581423, "epoch": 0.6868131868131868, "percentage": 22.89, "elapsed_time": "1:04:09", "remaining_time": "3:36:05"} {"current_steps": 250, "total_steps": 1092, "eval_loss": 0.9922270774841309, "epoch": 0.6868131868131868, "percentage": 22.89, "elapsed_time": "1:06:42", "remaining_time": "3:44:40"} {"current_steps": 260, "total_steps": 1092, "loss": 1.0029, "lr": 0.0001887051863451784, "epoch": 0.7142857142857143, "percentage": 23.81, "elapsed_time": "1:08:21", "remaining_time": "3:38:43"} {"current_steps": 270, "total_steps": 1092, "loss": 0.974, "lr": 0.00018718308466493744, "epoch": 0.7417582417582418, "percentage": 24.73, "elapsed_time": "1:09:56", "remaining_time": "3:32:54"} {"current_steps": 275, "total_steps": 1092, "eval_loss": 0.9837812185287476, "epoch": 0.7554945054945055, "percentage": 25.18, "elapsed_time": "1:13:17", "remaining_time": "3:37:44"} {"current_steps": 280, "total_steps": 1092, "loss": 0.9847, "lr": 0.00018557176098356405, "epoch": 0.7692307692307693, "percentage": 25.64, "elapsed_time": "1:14:05", "remaining_time": "3:34:51"} {"current_steps": 290, "total_steps": 1092, "loss": 0.9794, "lr": 0.00018387286430813208, "epoch": 0.7967032967032966, "percentage": 26.56, "elapsed_time": "1:15:46", "remaining_time": "3:29:33"} {"current_steps": 300, "total_steps": 1092, "loss": 0.9806, "lr": 0.00018208813326674444, "epoch": 0.8241758241758241, "percentage": 27.47, "elapsed_time": "1:17:26", "remaining_time": "3:24:25"} {"current_steps": 300, "total_steps": 1092, "eval_loss": 0.9748955965042114, "epoch": 0.8241758241758241, "percentage": 27.47, "elapsed_time": "1:19:59", "remaining_time": "3:31:09"} {"current_steps": 310, "total_steps": 1092, "loss": 0.9691, "lr": 0.00018021939432924454, "epoch": 0.8516483516483516, "percentage": 28.39, "elapsed_time": "1:21:37", "remaining_time": "3:25:54"} {"current_steps": 320, "total_steps": 1092, "loss": 0.9666, "lr": 0.00017826855993803147, "epoch": 0.8791208791208791, "percentage": 29.3, "elapsed_time": "1:23:13", "remaining_time": "3:20:45"} {"current_steps": 325, "total_steps": 1092, "eval_loss": 0.9662107229232788, "epoch": 0.8928571428571429, "percentage": 29.76, "elapsed_time": "1:26:34", "remaining_time": "3:24:18"} {"current_steps": 330, "total_steps": 1092, "loss": 0.9528, "lr": 0.00017623762655089207, "epoch": 0.9065934065934066, "percentage": 30.22, "elapsed_time": "1:27:24", "remaining_time": "3:21:50"} {"current_steps": 340, "total_steps": 1092, "loss": 0.9645, "lr": 0.00017412867259785286, "epoch": 0.9340659340659341, "percentage": 31.14, "elapsed_time": "1:29:03", "remaining_time": "3:16:59"} {"current_steps": 350, "total_steps": 1092, "loss": 0.9583, "lr": 0.00017194385635414244, "epoch": 0.9615384615384616, "percentage": 32.05, "elapsed_time": "1:30:41", "remaining_time": "3:12:16"} {"current_steps": 350, "total_steps": 1092, "eval_loss": 0.9582132697105408, "epoch": 0.9615384615384616, "percentage": 32.05, "elapsed_time": "1:33:14", "remaining_time": "3:17:41"} {"current_steps": 360, "total_steps": 1092, "loss": 0.9524, "lr": 0.00016968541373144156, "epoch": 0.989010989010989, "percentage": 32.97, "elapsed_time": "1:34:53", "remaining_time": "3:12:57"} {"current_steps": 370, "total_steps": 1092, "loss": 0.8974, "lr": 0.00016735565598968114, "epoch": 1.0164835164835164, "percentage": 33.88, "elapsed_time": "1:36:34", "remaining_time": "3:08:27"} {"current_steps": 375, "total_steps": 1092, "eval_loss": 0.9573748707771301, "epoch": 1.0302197802197801, "percentage": 34.34, "elapsed_time": "1:39:56", "remaining_time": "3:11:04"} {"current_steps": 380, "total_steps": 1092, "loss": 0.8925, "lr": 0.0001649569673717298, "epoch": 1.043956043956044, "percentage": 34.8, "elapsed_time": "1:40:45", "remaining_time": "3:08:46"} {"current_steps": 390, "total_steps": 1092, "loss": 0.8534, "lr": 0.0001624918026633916, "epoch": 1.0714285714285714, "percentage": 35.71, "elapsed_time": "1:42:25", "remaining_time": "3:04:21"} {"current_steps": 400, "total_steps": 1092, "loss": 0.8835, "lr": 0.00015996268468121102, "epoch": 1.098901098901099, "percentage": 36.63, "elapsed_time": "1:44:06", "remaining_time": "3:00:07"} {"current_steps": 400, "total_steps": 1092, "eval_loss": 0.9542333483695984, "epoch": 1.098901098901099, "percentage": 36.63, "elapsed_time": "1:46:40", "remaining_time": "3:04:32"} {"current_steps": 410, "total_steps": 1092, "loss": 0.882, "lr": 0.00015737220169065655, "epoch": 1.1263736263736264, "percentage": 37.55, "elapsed_time": "1:48:20", "remaining_time": "3:00:13"} {"current_steps": 420, "total_steps": 1092, "loss": 0.8702, "lr": 0.00015472300475732426, "epoch": 1.1538461538461537, "percentage": 38.46, "elapsed_time": "1:50:00", "remaining_time": "2:56:01"} {"current_steps": 425, "total_steps": 1092, "eval_loss": 0.9501178860664368, "epoch": 1.1675824175824177, "percentage": 38.92, "elapsed_time": "1:53:22", "remaining_time": "2:57:55"} {"current_steps": 430, "total_steps": 1092, "loss": 0.8845, "lr": 0.0001520178050338729, "epoch": 1.1813186813186813, "percentage": 39.38, "elapsed_time": "1:54:09", "remaining_time": "2:55:45"} {"current_steps": 440, "total_steps": 1092, "loss": 0.8954, "lr": 0.00014925937098546652, "epoch": 1.2087912087912087, "percentage": 40.29, "elapsed_time": "1:55:50", "remaining_time": "2:51:39"} {"current_steps": 450, "total_steps": 1092, "loss": 0.8682, "lr": 0.00014645052555656431, "epoch": 1.2362637362637363, "percentage": 41.21, "elapsed_time": "1:57:29", "remaining_time": "2:47:37"} {"current_steps": 450, "total_steps": 1092, "eval_loss": 0.9446578025817871, "epoch": 1.2362637362637363, "percentage": 41.21, "elapsed_time": "2:00:02", "remaining_time": "2:51:16"} {"current_steps": 460, "total_steps": 1092, "loss": 0.8782, "lr": 0.00014359414328195703, "epoch": 1.2637362637362637, "percentage": 42.12, "elapsed_time": "2:01:42", "remaining_time": "2:47:12"} {"current_steps": 470, "total_steps": 1092, "loss": 0.8604, "lr": 0.00014069314734500675, "epoch": 1.2912087912087913, "percentage": 43.04, "elapsed_time": "2:03:25", "remaining_time": "2:43:21"} {"current_steps": 475, "total_steps": 1092, "eval_loss": 0.9429782629013062, "epoch": 1.304945054945055, "percentage": 43.5, "elapsed_time": "2:06:49", "remaining_time": "2:44:44"} {"current_steps": 480, "total_steps": 1092, "loss": 0.8556, "lr": 0.00013775050658609988, "epoch": 1.3186813186813187, "percentage": 43.96, "elapsed_time": "2:07:40", "remaining_time": "2:42:46"} {"current_steps": 490, "total_steps": 1092, "loss": 0.8704, "lr": 0.0001347692324643759, "epoch": 1.3461538461538463, "percentage": 44.87, "elapsed_time": "2:09:20", "remaining_time": "2:38:54"} {"current_steps": 500, "total_steps": 1092, "loss": 0.8778, "lr": 0.00013175237597584045, "epoch": 1.3736263736263736, "percentage": 45.79, "elapsed_time": "2:10:58", "remaining_time": "2:35:04"} {"current_steps": 500, "total_steps": 1092, "eval_loss": 0.9382254481315613, "epoch": 1.3736263736263736, "percentage": 45.79, "elapsed_time": "2:13:31", "remaining_time": "2:38:06"} {"current_steps": 510, "total_steps": 1092, "loss": 0.8634, "lr": 0.00012870302453101657, "epoch": 1.401098901098901, "percentage": 46.7, "elapsed_time": "2:15:07", "remaining_time": "2:34:12"} {"current_steps": 520, "total_steps": 1092, "loss": 0.8659, "lr": 0.0001256242987953306, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "2:16:49", "remaining_time": "2:30:30"} {"current_steps": 525, "total_steps": 1092, "eval_loss": 0.9333315491676331, "epoch": 1.4423076923076923, "percentage": 48.08, "elapsed_time": "2:20:14", "remaining_time": "2:31:27"} {"current_steps": 530, "total_steps": 1092, "loss": 0.8686, "lr": 0.00012251934949546447, "epoch": 1.456043956043956, "percentage": 48.53, "elapsed_time": "2:21:03", "remaining_time": "2:29:34"} {"current_steps": 540, "total_steps": 1092, "loss": 0.8718, "lr": 0.00011939135419494456, "epoch": 1.4835164835164836, "percentage": 49.45, "elapsed_time": "2:22:44", "remaining_time": "2:25:54"} {"current_steps": 550, "total_steps": 1092, "loss": 0.862, "lr": 0.00011624351404226572, "epoch": 1.510989010989011, "percentage": 50.37, "elapsed_time": "2:24:22", "remaining_time": "2:22:16"} {"current_steps": 550, "total_steps": 1092, "eval_loss": 0.9310413599014282, "epoch": 1.510989010989011, "percentage": 50.37, "elapsed_time": "2:26:55", "remaining_time": "2:24:47"} {"current_steps": 560, "total_steps": 1092, "loss": 0.8614, "lr": 0.00011307905049487855, "epoch": 1.5384615384615383, "percentage": 51.28, "elapsed_time": "2:28:32", "remaining_time": "2:21:07"} {"current_steps": 570, "total_steps": 1092, "loss": 0.8625, "lr": 0.00010990120202239324, "epoch": 1.565934065934066, "percentage": 52.2, "elapsed_time": "2:30:14", "remaining_time": "2:17:35"} {"current_steps": 575, "total_steps": 1092, "eval_loss": 0.9275878071784973, "epoch": 1.5796703296703298, "percentage": 52.66, "elapsed_time": "2:33:40", "remaining_time": "2:18:10"} {"current_steps": 580, "total_steps": 1092, "loss": 0.8747, "lr": 0.00010671322079237307, "epoch": 1.5934065934065935, "percentage": 53.11, "elapsed_time": "2:34:27", "remaining_time": "2:16:21"} {"current_steps": 590, "total_steps": 1092, "loss": 0.8656, "lr": 0.00010351836934210957, "epoch": 1.620879120879121, "percentage": 54.03, "elapsed_time": "2:36:07", "remaining_time": "2:12:50"} {"current_steps": 600, "total_steps": 1092, "loss": 0.848, "lr": 0.00010031991723978574, "epoch": 1.6483516483516483, "percentage": 54.95, "elapsed_time": "2:37:44", "remaining_time": "2:09:20"} {"current_steps": 600, "total_steps": 1092, "eval_loss": 0.924781322479248, "epoch": 1.6483516483516483, "percentage": 54.95, "elapsed_time": "2:40:17", "remaining_time": "2:11:26"} {"current_steps": 610, "total_steps": 1092, "loss": 0.8641, "lr": 9.712113773844361e-05, "epoch": 1.6758241758241759, "percentage": 55.86, "elapsed_time": "2:41:57", "remaining_time": "2:07:58"} {"current_steps": 620, "total_steps": 1092, "loss": 0.8662, "lr": 9.3925304426181e-05, "epoch": 1.7032967032967035, "percentage": 56.78, "elapsed_time": "2:43:35", "remaining_time": "2:04:32"} {"current_steps": 625, "total_steps": 1092, "eval_loss": 0.9215436577796936, "epoch": 1.7170329670329672, "percentage": 57.23, "elapsed_time": "2:46:55", "remaining_time": "2:04:43"} {"current_steps": 630, "total_steps": 1092, "loss": 0.8751, "lr": 9.073568787600539e-05, "epoch": 1.7307692307692308, "percentage": 57.69, "elapsed_time": "2:47:49", "remaining_time": "2:03:04"} {"current_steps": 640, "total_steps": 1092, "loss": 0.859, "lr": 8.755555229877294e-05, "epoch": 1.7582417582417582, "percentage": 58.61, "elapsed_time": "2:49:26", "remaining_time": "1:59:39"} {"current_steps": 650, "total_steps": 1092, "loss": 0.8438, "lr": 8.438815220263941e-05, "epoch": 1.7857142857142856, "percentage": 59.52, "elapsed_time": "2:51:02", "remaining_time": "1:56:18"} {"current_steps": 650, "total_steps": 1092, "eval_loss": 0.919314444065094, "epoch": 1.7857142857142856, "percentage": 59.52, "elapsed_time": "2:53:35", "remaining_time": "1:58:02"} {"current_steps": 660, "total_steps": 1092, "loss": 0.8619, "lr": 8.123672906243955e-05, "epoch": 1.8131868131868132, "percentage": 60.44, "elapsed_time": "2:55:12", "remaining_time": "1:54:41"} {"current_steps": 670, "total_steps": 1092, "loss": 0.8457, "lr": 7.810450800240549e-05, "epoch": 1.8406593406593408, "percentage": 61.36, "elapsed_time": "2:56:53", "remaining_time": "1:51:25"} {"current_steps": 675, "total_steps": 1092, "eval_loss": 0.9163983464241028, "epoch": 1.8543956043956045, "percentage": 61.81, "elapsed_time": "3:00:14", "remaining_time": "1:51:20"} {"current_steps": 680, "total_steps": 1092, "loss": 0.8548, "lr": 7.499469449561769e-05, "epoch": 1.8681318681318682, "percentage": 62.27, "elapsed_time": "3:01:04", "remaining_time": "1:49:42"} {"current_steps": 690, "total_steps": 1092, "loss": 0.8776, "lr": 7.191047108356672e-05, "epoch": 1.8956043956043955, "percentage": 63.19, "elapsed_time": "3:02:44", "remaining_time": "1:46:28"} {"current_steps": 700, "total_steps": 1092, "loss": 0.8629, "lr": 6.885499411918304e-05, "epoch": 1.9230769230769231, "percentage": 64.1, "elapsed_time": "3:04:23", "remaining_time": "1:43:15"} {"current_steps": 700, "total_steps": 1092, "eval_loss": 0.9145733118057251, "epoch": 1.9230769230769231, "percentage": 64.1, "elapsed_time": "3:06:56", "remaining_time": "1:44:41"} {"current_steps": 710, "total_steps": 1092, "loss": 0.8534, "lr": 6.583139053666745e-05, "epoch": 1.9505494505494505, "percentage": 65.02, "elapsed_time": "3:08:37", "remaining_time": "1:41:28"} {"current_steps": 720, "total_steps": 1092, "loss": 0.8401, "lr": 6.284275465142874e-05, "epoch": 1.978021978021978, "percentage": 65.93, "elapsed_time": "3:10:14", "remaining_time": "1:38:17"} {"current_steps": 725, "total_steps": 1092, "eval_loss": 0.912276566028595, "epoch": 1.9917582417582418, "percentage": 66.39, "elapsed_time": "3:13:36", "remaining_time": "1:38:00"} {"current_steps": 730, "total_steps": 1092, "loss": 0.8125, "lr": 5.989214499340267e-05, "epoch": 2.0054945054945055, "percentage": 66.85, "elapsed_time": "3:14:23", "remaining_time": "1:36:23"} {"current_steps": 740, "total_steps": 1092, "loss": 0.7576, "lr": 5.6982581176993335e-05, "epoch": 2.032967032967033, "percentage": 67.77, "elapsed_time": "3:16:00", "remaining_time": "1:33:14"} {"current_steps": 750, "total_steps": 1092, "loss": 0.7507, "lr": 5.4117040810840246e-05, "epoch": 2.0604395604395602, "percentage": 68.68, "elapsed_time": "3:17:36", "remaining_time": "1:30:06"} {"current_steps": 750, "total_steps": 1092, "eval_loss": 0.9363195300102234, "epoch": 2.0604395604395602, "percentage": 68.68, "elapsed_time": "3:20:09", "remaining_time": "1:31:16"} {"current_steps": 760, "total_steps": 1092, "loss": 0.7568, "lr": 5.129845645057372e-05, "epoch": 2.087912087912088, "percentage": 69.6, "elapsed_time": "3:21:48", "remaining_time": "1:28:09"} {"current_steps": 770, "total_steps": 1092, "loss": 0.7442, "lr": 4.8529712597676426e-05, "epoch": 2.1153846153846154, "percentage": 70.51, "elapsed_time": "3:23:27", "remaining_time": "1:25:04"} {"current_steps": 775, "total_steps": 1092, "eval_loss": 0.9283037781715393, "epoch": 2.129120879120879, "percentage": 70.97, "elapsed_time": "3:26:52", "remaining_time": "1:24:37"} {"current_steps": 780, "total_steps": 1092, "loss": 0.7643, "lr": 4.581364274752338e-05, "epoch": 2.142857142857143, "percentage": 71.43, "elapsed_time": "3:27:42", "remaining_time": "1:23:05"} {"current_steps": 790, "total_steps": 1092, "loss": 0.7394, "lr": 4.315302648962066e-05, "epoch": 2.17032967032967, "percentage": 72.34, "elapsed_time": "3:29:18", "remaining_time": "1:20:00"} {"current_steps": 800, "total_steps": 1092, "loss": 0.7561, "lr": 4.055058666301087e-05, "epoch": 2.197802197802198, "percentage": 73.26, "elapsed_time": "3:31:00", "remaining_time": "1:17:00"} {"current_steps": 800, "total_steps": 1092, "eval_loss": 0.9290263652801514, "epoch": 2.197802197802198, "percentage": 73.26, "elapsed_time": "3:33:33", "remaining_time": "1:17:56"} {"current_steps": 810, "total_steps": 1092, "loss": 0.7534, "lr": 3.800898656975599e-05, "epoch": 2.2252747252747254, "percentage": 74.18, "elapsed_time": "3:35:14", "remaining_time": "1:14:56"} {"current_steps": 820, "total_steps": 1092, "loss": 0.759, "lr": 3.553082724934973e-05, "epoch": 2.2527472527472527, "percentage": 75.09, "elapsed_time": "3:36:49", "remaining_time": "1:11:55"} {"current_steps": 825, "total_steps": 1092, "eval_loss": 0.9296738505363464, "epoch": 2.2664835164835164, "percentage": 75.55, "elapsed_time": "3:40:10", "remaining_time": "1:11:15"} {"current_steps": 830, "total_steps": 1092, "loss": 0.75, "lr": 3.3118644816848574e-05, "epoch": 2.28021978021978, "percentage": 76.01, "elapsed_time": "3:41:01", "remaining_time": "1:09:46"} {"current_steps": 840, "total_steps": 1092, "loss": 0.7616, "lr": 3.077490786744562e-05, "epoch": 2.3076923076923075, "percentage": 76.92, "elapsed_time": "3:42:35", "remaining_time": "1:06:46"} {"current_steps": 850, "total_steps": 1092, "loss": 0.756, "lr": 2.8502014950143373e-05, "epoch": 2.3351648351648353, "percentage": 77.84, "elapsed_time": "3:44:13", "remaining_time": "1:03:50"} {"current_steps": 850, "total_steps": 1092, "eval_loss": 0.9292080998420715, "epoch": 2.3351648351648353, "percentage": 77.84, "elapsed_time": "3:46:46", "remaining_time": "1:04:33"} {"current_steps": 860, "total_steps": 1092, "loss": 0.748, "lr": 2.6302292113110637e-05, "epoch": 2.3626373626373627, "percentage": 78.75, "elapsed_time": "3:48:22", "remaining_time": "1:01:36"} {"current_steps": 870, "total_steps": 1092, "loss": 0.7568, "lr": 2.4177990523236216e-05, "epoch": 2.39010989010989, "percentage": 79.67, "elapsed_time": "3:50:01", "remaining_time": "0:58:41"} {"current_steps": 875, "total_steps": 1092, "eval_loss": 0.9285762310028076, "epoch": 2.4038461538461537, "percentage": 80.13, "elapsed_time": "3:53:24", "remaining_time": "0:57:53"} {"current_steps": 880, "total_steps": 1092, "loss": 0.7543, "lr": 2.213128416231468e-05, "epoch": 2.4175824175824174, "percentage": 80.59, "elapsed_time": "3:54:12", "remaining_time": "0:56:25"} {"current_steps": 890, "total_steps": 1092, "loss": 0.7547, "lr": 2.0164267602222586e-05, "epoch": 2.4450549450549453, "percentage": 81.5, "elapsed_time": "3:55:52", "remaining_time": "0:53:32"} {"current_steps": 900, "total_steps": 1092, "loss": 0.7555, "lr": 1.827895386136166e-05, "epoch": 2.4725274725274726, "percentage": 82.42, "elapsed_time": "3:57:33", "remaining_time": "0:50:40"} {"current_steps": 900, "total_steps": 1092, "eval_loss": 0.9276696443557739, "epoch": 2.4725274725274726, "percentage": 82.42, "elapsed_time": "4:00:06", "remaining_time": "0:51:13"} {"current_steps": 910, "total_steps": 1092, "loss": 0.7639, "lr": 1.647727234456279e-05, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "4:01:45", "remaining_time": "0:48:21"} {"current_steps": 920, "total_steps": 1092, "loss": 0.7489, "lr": 1.4761066868558914e-05, "epoch": 2.5274725274725274, "percentage": 84.25, "elapsed_time": "4:03:21", "remaining_time": "0:45:29"} {"current_steps": 925, "total_steps": 1092, "eval_loss": 0.9275524020195007, "epoch": 2.541208791208791, "percentage": 84.71, "elapsed_time": "4:06:46", "remaining_time": "0:44:33"} {"current_steps": 930, "total_steps": 1092, "loss": 0.7487, "lr": 1.3132093775047615e-05, "epoch": 2.5549450549450547, "percentage": 85.16, "elapsed_time": "4:07:33", "remaining_time": "0:43:07"} {"current_steps": 940, "total_steps": 1092, "loss": 0.7635, "lr": 1.1592020133274639e-05, "epoch": 2.5824175824175826, "percentage": 86.08, "elapsed_time": "4:09:11", "remaining_time": "0:40:17"} {"current_steps": 950, "total_steps": 1092, "loss": 0.752, "lr": 1.0142422033977505e-05, "epoch": 2.60989010989011, "percentage": 87.0, "elapsed_time": "4:10:52", "remaining_time": "0:37:29"} {"current_steps": 950, "total_steps": 1092, "eval_loss": 0.9266554117202759, "epoch": 2.60989010989011, "percentage": 87.0, "elapsed_time": "4:13:25", "remaining_time": "0:37:52"} {"current_steps": 960, "total_steps": 1092, "loss": 0.745, "lr": 8.784782976435424e-06, "epoch": 2.6373626373626373, "percentage": 87.91, "elapsed_time": "4:15:05", "remaining_time": "0:35:04"} {"current_steps": 970, "total_steps": 1092, "loss": 0.7443, "lr": 7.520492350275876e-06, "epoch": 2.6648351648351647, "percentage": 88.83, "elapsed_time": "4:16:46", "remaining_time": "0:32:17"} {"current_steps": 975, "total_steps": 1092, "eval_loss": 0.9264477491378784, "epoch": 2.678571428571429, "percentage": 89.29, "elapsed_time": "4:20:09", "remaining_time": "0:31:13"} {"current_steps": 980, "total_steps": 1092, "loss": 0.7527, "lr": 6.350844013592061e-06, "epoch": 2.6923076923076925, "percentage": 89.74, "elapsed_time": "4:20:57", "remaining_time": "0:29:49"} {"current_steps": 990, "total_steps": 1092, "loss": 0.7635, "lr": 5.277034968825667e-06, "epoch": 2.71978021978022, "percentage": 90.66, "elapsed_time": "4:22:36", "remaining_time": "0:27:03"} {"current_steps": 1000, "total_steps": 1092, "loss": 0.7477, "lr": 4.3001641377707125e-06, "epoch": 2.7472527472527473, "percentage": 91.58, "elapsed_time": "4:24:15", "remaining_time": "0:24:18"} {"current_steps": 1000, "total_steps": 1092, "eval_loss": 0.9256552457809448, "epoch": 2.7472527472527473, "percentage": 91.58, "elapsed_time": "4:26:49", "remaining_time": "0:24:32"} {"current_steps": 1010, "total_steps": 1092, "loss": 0.7328, "lr": 3.4212312369516497e-06, "epoch": 2.7747252747252746, "percentage": 92.49, "elapsed_time": "4:28:28", "remaining_time": "0:21:47"} {"current_steps": 1020, "total_steps": 1092, "loss": 0.7496, "lr": 2.6411357545269577e-06, "epoch": 2.802197802197802, "percentage": 93.41, "elapsed_time": "4:30:09", "remaining_time": "0:19:04"} {"current_steps": 1025, "total_steps": 1092, "eval_loss": 0.9259692430496216, "epoch": 2.8159340659340657, "percentage": 93.86, "elapsed_time": "4:33:35", "remaining_time": "0:17:52"} {"current_steps": 1030, "total_steps": 1092, "loss": 0.7651, "lr": 1.960676029764874e-06, "epoch": 2.82967032967033, "percentage": 94.32, "elapsed_time": "4:34:23", "remaining_time": "0:16:30"} {"current_steps": 1040, "total_steps": 1092, "loss": 0.7364, "lr": 1.3805484360337906e-06, "epoch": 2.857142857142857, "percentage": 95.24, "elapsed_time": "4:36:04", "remaining_time": "0:13:48"} {"current_steps": 1050, "total_steps": 1092, "loss": 0.7417, "lr": 9.013466681429994e-07, "epoch": 2.8846153846153846, "percentage": 96.15, "elapsed_time": "4:37:44", "remaining_time": "0:11:06"} {"current_steps": 1050, "total_steps": 1092, "eval_loss": 0.9257997274398804, "epoch": 2.8846153846153846, "percentage": 96.15, "elapsed_time": "4:40:17", "remaining_time": "0:11:12"} {"current_steps": 1060, "total_steps": 1092, "loss": 0.737, "lr": 5.235611347634172e-07, "epoch": 2.912087912087912, "percentage": 97.07, "elapsed_time": "4:41:56", "remaining_time": "0:08:30"} {"current_steps": 1070, "total_steps": 1092, "loss": 0.7438, "lr": 2.4757845654992397e-07, "epoch": 2.9395604395604398, "percentage": 97.99, "elapsed_time": "4:43:35", "remaining_time": "0:05:49"} {"current_steps": 1075, "total_steps": 1092, "eval_loss": 0.9256556034088135, "epoch": 2.9532967032967035, "percentage": 98.44, "elapsed_time": "4:46:59", "remaining_time": "0:04:32"} {"current_steps": 1080, "total_steps": 1092, "loss": 0.7651, "lr": 7.368107047894812e-08, "epoch": 2.967032967032967, "percentage": 98.9, "elapsed_time": "4:47:48", "remaining_time": "0:03:11"} {"current_steps": 1090, "total_steps": 1092, "loss": 0.7437, "lr": 2.046940806244013e-09, "epoch": 2.9945054945054945, "percentage": 99.82, "elapsed_time": "4:49:28", "remaining_time": "0:00:31"} {"current_steps": 1092, "total_steps": 1092, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "4:49:47", "remaining_time": "0:00:00"}