diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -32341,3 +32341,1800 @@ {"current_steps": 161620, "total_steps": 179580, "loss": 0.6252, "lr": 1.5081831318557533e-06, "epoch": 17.999777258046553, "percentage": 90.0, "elapsed_time": "16:16:52", "remaining_time": "1:48:33", "throughput": 3353.16, "total_tokens": 196535136} {"current_steps": 161622, "total_steps": 179580, "eval_loss": 0.7087222337722778, "epoch": 18.0, "percentage": 90.0, "elapsed_time": "16:18:42", "remaining_time": "1:48:44", "throughput": 3346.88, "total_tokens": 196536784} {"current_steps": 161625, "total_steps": 179580, "loss": 0.9427, "lr": 1.5073520903972904e-06, "epoch": 18.00033411293017, "percentage": 90.0, "elapsed_time": "16:18:45", "remaining_time": "1:48:43", "throughput": 3346.76, "total_tokens": 196540432} +{"current_steps": 161630, "total_steps": 179580, "loss": 0.902, "lr": 1.5065212708457094e-06, "epoch": 18.00089096781379, "percentage": 90.0, "elapsed_time": "16:18:47", "remaining_time": "1:48:42", "throughput": 3346.76, "total_tokens": 196546672} +{"current_steps": 161635, "total_steps": 179580, "loss": 0.6867, "lr": 1.5056906732088565e-06, "epoch": 18.001447822697404, "percentage": 90.01, "elapsed_time": "16:18:49", "remaining_time": "1:48:40", "throughput": 3346.77, "total_tokens": 196552816} +{"current_steps": 161640, "total_steps": 179580, "loss": 0.8089, "lr": 1.5048602974945758e-06, "epoch": 18.002004677581024, "percentage": 90.01, "elapsed_time": "16:18:50", "remaining_time": "1:48:38", "throughput": 3346.77, "total_tokens": 196558704} +{"current_steps": 161645, "total_steps": 179580, "loss": 0.65, "lr": 1.5040301437107162e-06, "epoch": 18.00256153246464, "percentage": 90.01, "elapsed_time": "16:18:52", "remaining_time": "1:48:36", "throughput": 3346.77, "total_tokens": 196564560} +{"current_steps": 161650, "total_steps": 179580, "loss": 0.7165, "lr": 1.5032002118651134e-06, "epoch": 18.003118387348255, "percentage": 90.02, "elapsed_time": "16:18:54", "remaining_time": "1:48:34", "throughput": 3346.77, "total_tokens": 196570064} +{"current_steps": 161655, "total_steps": 179580, "loss": 0.9194, "lr": 1.5023705019656138e-06, "epoch": 18.003675242231875, "percentage": 90.02, "elapsed_time": "16:18:55", "remaining_time": "1:48:32", "throughput": 3346.77, "total_tokens": 196575920} +{"current_steps": 161660, "total_steps": 179580, "loss": 0.969, "lr": 1.5015410140200553e-06, "epoch": 18.00423209711549, "percentage": 90.02, "elapsed_time": "16:18:57", "remaining_time": "1:48:31", "throughput": 3346.78, "total_tokens": 196581872} +{"current_steps": 161665, "total_steps": 179580, "loss": 0.7433, "lr": 1.5007117480362597e-06, "epoch": 18.00478895199911, "percentage": 90.02, "elapsed_time": "16:18:59", "remaining_time": "1:48:29", "throughput": 3346.78, "total_tokens": 196587440} +{"current_steps": 161670, "total_steps": 179580, "loss": 0.6137, "lr": 1.4998827040220736e-06, "epoch": 18.005345806882726, "percentage": 90.03, "elapsed_time": "16:19:01", "remaining_time": "1:48:27", "throughput": 3346.78, "total_tokens": 196593392} +{"current_steps": 161675, "total_steps": 179580, "loss": 0.635, "lr": 1.4990538819853183e-06, "epoch": 18.005902661766342, "percentage": 90.03, "elapsed_time": "16:19:02", "remaining_time": "1:48:25", "throughput": 3346.79, "total_tokens": 196599376} +{"current_steps": 161680, "total_steps": 179580, "loss": 0.6598, "lr": 1.4982252819338322e-06, "epoch": 18.00645951664996, "percentage": 90.03, "elapsed_time": "16:19:04", "remaining_time": "1:48:23", "throughput": 3346.79, "total_tokens": 196605360} +{"current_steps": 161685, "total_steps": 179580, "loss": 0.7061, "lr": 1.4973969038754392e-06, "epoch": 18.007016371533577, "percentage": 90.04, "elapsed_time": "16:19:06", "remaining_time": "1:48:21", "throughput": 3346.79, "total_tokens": 196611344} +{"current_steps": 161690, "total_steps": 179580, "loss": 0.6742, "lr": 1.4965687478179613e-06, "epoch": 18.007573226417197, "percentage": 90.04, "elapsed_time": "16:19:07", "remaining_time": "1:48:20", "throughput": 3346.8, "total_tokens": 196617360} +{"current_steps": 161695, "total_steps": 179580, "loss": 0.8384, "lr": 1.495740813769217e-06, "epoch": 18.008130081300813, "percentage": 90.04, "elapsed_time": "16:19:09", "remaining_time": "1:48:18", "throughput": 3346.8, "total_tokens": 196622704} +{"current_steps": 161700, "total_steps": 179580, "loss": 0.7037, "lr": 1.494913101737036e-06, "epoch": 18.00868693618443, "percentage": 90.04, "elapsed_time": "16:19:11", "remaining_time": "1:48:16", "throughput": 3346.8, "total_tokens": 196628336} +{"current_steps": 161705, "total_steps": 179580, "loss": 1.0197, "lr": 1.4940856117292346e-06, "epoch": 18.009243791068048, "percentage": 90.05, "elapsed_time": "16:19:12", "remaining_time": "1:48:14", "throughput": 3346.8, "total_tokens": 196634224} +{"current_steps": 161710, "total_steps": 179580, "loss": 0.4129, "lr": 1.4932583437536257e-06, "epoch": 18.009800645951664, "percentage": 90.05, "elapsed_time": "16:19:14", "remaining_time": "1:48:12", "throughput": 3346.81, "total_tokens": 196640176} +{"current_steps": 161715, "total_steps": 179580, "loss": 0.962, "lr": 1.4924312978180227e-06, "epoch": 18.010357500835283, "percentage": 90.05, "elapsed_time": "16:19:16", "remaining_time": "1:48:10", "throughput": 3346.81, "total_tokens": 196646320} +{"current_steps": 161720, "total_steps": 179580, "loss": 0.6698, "lr": 1.4916044739302415e-06, "epoch": 18.0109143557189, "percentage": 90.05, "elapsed_time": "16:19:18", "remaining_time": "1:48:09", "throughput": 3346.81, "total_tokens": 196652624} +{"current_steps": 161725, "total_steps": 179580, "loss": 0.7189, "lr": 1.4907778720980898e-06, "epoch": 18.011471210602515, "percentage": 90.06, "elapsed_time": "16:19:19", "remaining_time": "1:48:07", "throughput": 3346.82, "total_tokens": 196658960} +{"current_steps": 161730, "total_steps": 179580, "loss": 0.7919, "lr": 1.4899514923293806e-06, "epoch": 18.012028065486135, "percentage": 90.06, "elapsed_time": "16:19:21", "remaining_time": "1:48:05", "throughput": 3346.82, "total_tokens": 196665104} +{"current_steps": 161735, "total_steps": 179580, "loss": 0.8081, "lr": 1.4891253346319106e-06, "epoch": 18.01258492036975, "percentage": 90.06, "elapsed_time": "16:19:23", "remaining_time": "1:48:03", "throughput": 3346.83, "total_tokens": 196671248} +{"current_steps": 161740, "total_steps": 179580, "loss": 0.8347, "lr": 1.488299399013493e-06, "epoch": 18.01314177525337, "percentage": 90.07, "elapsed_time": "16:19:25", "remaining_time": "1:48:01", "throughput": 3346.83, "total_tokens": 196677296} +{"current_steps": 161745, "total_steps": 179580, "loss": 0.8727, "lr": 1.4874736854819189e-06, "epoch": 18.013698630136986, "percentage": 90.07, "elapsed_time": "16:19:26", "remaining_time": "1:48:00", "throughput": 3346.83, "total_tokens": 196683152} +{"current_steps": 161750, "total_steps": 179580, "loss": 0.8339, "lr": 1.4866481940449984e-06, "epoch": 18.014255485020605, "percentage": 90.07, "elapsed_time": "16:19:28", "remaining_time": "1:47:58", "throughput": 3346.84, "total_tokens": 196689680} +{"current_steps": 161755, "total_steps": 179580, "loss": 0.7696, "lr": 1.4858229247105225e-06, "epoch": 18.01481233990422, "percentage": 90.07, "elapsed_time": "16:19:30", "remaining_time": "1:47:56", "throughput": 3346.84, "total_tokens": 196695664} +{"current_steps": 161760, "total_steps": 179580, "loss": 0.898, "lr": 1.4849978774862911e-06, "epoch": 18.015369194787837, "percentage": 90.08, "elapsed_time": "16:19:32", "remaining_time": "1:47:54", "throughput": 3346.84, "total_tokens": 196701392} +{"current_steps": 161765, "total_steps": 179580, "loss": 0.5354, "lr": 1.4841730523800889e-06, "epoch": 18.015926049671457, "percentage": 90.08, "elapsed_time": "16:19:33", "remaining_time": "1:47:52", "throughput": 3346.85, "total_tokens": 196707216} +{"current_steps": 161770, "total_steps": 179580, "loss": 0.6725, "lr": 1.4833484493997156e-06, "epoch": 18.016482904555073, "percentage": 90.08, "elapsed_time": "16:19:35", "remaining_time": "1:47:50", "throughput": 3346.85, "total_tokens": 196713424} +{"current_steps": 161775, "total_steps": 179580, "loss": 0.8138, "lr": 1.4825240685529595e-06, "epoch": 18.017039759438692, "percentage": 90.09, "elapsed_time": "16:19:37", "remaining_time": "1:47:49", "throughput": 3346.85, "total_tokens": 196719344} +{"current_steps": 161780, "total_steps": 179580, "loss": 0.6228, "lr": 1.4816999098476059e-06, "epoch": 18.017596614322308, "percentage": 90.09, "elapsed_time": "16:19:39", "remaining_time": "1:47:47", "throughput": 3346.86, "total_tokens": 196725488} +{"current_steps": 161785, "total_steps": 179580, "loss": 0.5287, "lr": 1.4808759732914347e-06, "epoch": 18.018153469205924, "percentage": 90.09, "elapsed_time": "16:19:41", "remaining_time": "1:47:45", "throughput": 3346.86, "total_tokens": 196731792} +{"current_steps": 161790, "total_steps": 179580, "loss": 0.8316, "lr": 1.4800522588922366e-06, "epoch": 18.018710324089543, "percentage": 90.09, "elapsed_time": "16:19:42", "remaining_time": "1:47:43", "throughput": 3346.86, "total_tokens": 196737008} +{"current_steps": 161795, "total_steps": 179580, "loss": 0.9738, "lr": 1.4792287666577864e-06, "epoch": 18.01926717897316, "percentage": 90.1, "elapsed_time": "16:19:44", "remaining_time": "1:47:41", "throughput": 3346.87, "total_tokens": 196743152} +{"current_steps": 161800, "total_steps": 179580, "loss": 0.5984, "lr": 1.4784054965958666e-06, "epoch": 18.01982403385678, "percentage": 90.1, "elapsed_time": "16:19:46", "remaining_time": "1:47:39", "throughput": 3346.87, "total_tokens": 196749584} +{"current_steps": 161805, "total_steps": 179580, "loss": 0.5238, "lr": 1.4775824487142515e-06, "epoch": 18.020380888740394, "percentage": 90.1, "elapsed_time": "16:19:47", "remaining_time": "1:47:38", "throughput": 3346.87, "total_tokens": 196755216} +{"current_steps": 161810, "total_steps": 179580, "loss": 0.6291, "lr": 1.4767596230207182e-06, "epoch": 18.02093774362401, "percentage": 90.1, "elapsed_time": "16:19:49", "remaining_time": "1:47:36", "throughput": 3346.88, "total_tokens": 196761296} +{"current_steps": 161815, "total_steps": 179580, "loss": 0.6596, "lr": 1.4759370195230327e-06, "epoch": 18.02149459850763, "percentage": 90.11, "elapsed_time": "16:19:51", "remaining_time": "1:47:34", "throughput": 3346.88, "total_tokens": 196767472} +{"current_steps": 161820, "total_steps": 179580, "loss": 0.7553, "lr": 1.475114638228972e-06, "epoch": 18.022051453391246, "percentage": 90.11, "elapsed_time": "16:19:52", "remaining_time": "1:47:32", "throughput": 3346.88, "total_tokens": 196773040} +{"current_steps": 161825, "total_steps": 179580, "loss": 0.6241, "lr": 1.4742924791463024e-06, "epoch": 18.022608308274865, "percentage": 90.11, "elapsed_time": "16:19:54", "remaining_time": "1:47:30", "throughput": 3346.89, "total_tokens": 196779056} +{"current_steps": 161830, "total_steps": 179580, "loss": 0.8791, "lr": 1.4734705422827898e-06, "epoch": 18.02316516315848, "percentage": 90.12, "elapsed_time": "16:19:56", "remaining_time": "1:47:28", "throughput": 3346.89, "total_tokens": 196785008} +{"current_steps": 161835, "total_steps": 179580, "loss": 0.7082, "lr": 1.472648827646192e-06, "epoch": 18.023722018042097, "percentage": 90.12, "elapsed_time": "16:19:58", "remaining_time": "1:47:27", "throughput": 3346.89, "total_tokens": 196790928} +{"current_steps": 161840, "total_steps": 179580, "loss": 0.7366, "lr": 1.4718273352442773e-06, "epoch": 18.024278872925716, "percentage": 90.12, "elapsed_time": "16:19:59", "remaining_time": "1:47:25", "throughput": 3346.9, "total_tokens": 196796944} +{"current_steps": 161845, "total_steps": 179580, "loss": 0.5987, "lr": 1.471006065084804e-06, "epoch": 18.024835727809332, "percentage": 90.12, "elapsed_time": "16:20:01", "remaining_time": "1:47:23", "throughput": 3346.9, "total_tokens": 196803120} +{"current_steps": 161850, "total_steps": 179580, "loss": 0.6349, "lr": 1.470185017175535e-06, "epoch": 18.02539258269295, "percentage": 90.13, "elapsed_time": "16:20:03", "remaining_time": "1:47:21", "throughput": 3346.9, "total_tokens": 196809456} +{"current_steps": 161855, "total_steps": 179580, "loss": 0.5558, "lr": 1.4693641915242112e-06, "epoch": 18.025949437576568, "percentage": 90.13, "elapsed_time": "16:20:05", "remaining_time": "1:47:19", "throughput": 3346.9, "total_tokens": 196814832} +{"current_steps": 161860, "total_steps": 179580, "loss": 0.6503, "lr": 1.4685435881386016e-06, "epoch": 18.026506292460184, "percentage": 90.13, "elapsed_time": "16:20:06", "remaining_time": "1:47:18", "throughput": 3346.91, "total_tokens": 196821008} +{"current_steps": 161865, "total_steps": 179580, "loss": 0.7213, "lr": 1.4677232070264473e-06, "epoch": 18.027063147343803, "percentage": 90.14, "elapsed_time": "16:20:08", "remaining_time": "1:47:16", "throughput": 3346.91, "total_tokens": 196827088} +{"current_steps": 161870, "total_steps": 179580, "loss": 0.7107, "lr": 1.4669030481955032e-06, "epoch": 18.02762000222742, "percentage": 90.14, "elapsed_time": "16:20:10", "remaining_time": "1:47:14", "throughput": 3346.92, "total_tokens": 196833168} +{"current_steps": 161875, "total_steps": 179580, "loss": 0.9948, "lr": 1.4660831116535156e-06, "epoch": 18.02817685711104, "percentage": 90.14, "elapsed_time": "16:20:12", "remaining_time": "1:47:12", "throughput": 3346.92, "total_tokens": 196839472} +{"current_steps": 161880, "total_steps": 179580, "loss": 0.6326, "lr": 1.465263397408226e-06, "epoch": 18.028733711994654, "percentage": 90.14, "elapsed_time": "16:20:13", "remaining_time": "1:47:10", "throughput": 3346.92, "total_tokens": 196845840} +{"current_steps": 161885, "total_steps": 179580, "loss": 0.9608, "lr": 1.4644439054673776e-06, "epoch": 18.02929056687827, "percentage": 90.15, "elapsed_time": "16:20:15", "remaining_time": "1:47:08", "throughput": 3346.93, "total_tokens": 196851280} +{"current_steps": 161890, "total_steps": 179580, "loss": 0.8128, "lr": 1.4636246358387146e-06, "epoch": 18.02984742176189, "percentage": 90.15, "elapsed_time": "16:20:17", "remaining_time": "1:47:07", "throughput": 3346.93, "total_tokens": 196857168} +{"current_steps": 161895, "total_steps": 179580, "loss": 0.6243, "lr": 1.4628055885299751e-06, "epoch": 18.030404276645505, "percentage": 90.15, "elapsed_time": "16:20:19", "remaining_time": "1:47:05", "throughput": 3346.93, "total_tokens": 196863440} +{"current_steps": 161900, "total_steps": 179580, "loss": 0.7461, "lr": 1.4619867635488948e-06, "epoch": 18.030961131529125, "percentage": 90.15, "elapsed_time": "16:20:20", "remaining_time": "1:47:03", "throughput": 3346.94, "total_tokens": 196869872} +{"current_steps": 161905, "total_steps": 179580, "loss": 0.5409, "lr": 1.4611681609032035e-06, "epoch": 18.03151798641274, "percentage": 90.16, "elapsed_time": "16:20:22", "remaining_time": "1:47:01", "throughput": 3346.94, "total_tokens": 196875856} +{"current_steps": 161910, "total_steps": 179580, "loss": 0.5226, "lr": 1.4603497806006423e-06, "epoch": 18.032074841296357, "percentage": 90.16, "elapsed_time": "16:20:24", "remaining_time": "1:46:59", "throughput": 3346.94, "total_tokens": 196882064} +{"current_steps": 161915, "total_steps": 179580, "loss": 0.7877, "lr": 1.4595316226489353e-06, "epoch": 18.032631696179976, "percentage": 90.16, "elapsed_time": "16:20:26", "remaining_time": "1:46:57", "throughput": 3346.95, "total_tokens": 196888176} +{"current_steps": 161920, "total_steps": 179580, "loss": 0.877, "lr": 1.4587136870558156e-06, "epoch": 18.033188551063592, "percentage": 90.17, "elapsed_time": "16:20:27", "remaining_time": "1:46:56", "throughput": 3346.95, "total_tokens": 196894224} +{"current_steps": 161925, "total_steps": 179580, "loss": 0.8468, "lr": 1.4578959738290015e-06, "epoch": 18.03374540594721, "percentage": 90.17, "elapsed_time": "16:20:29", "remaining_time": "1:46:54", "throughput": 3346.96, "total_tokens": 196900560} +{"current_steps": 161930, "total_steps": 179580, "loss": 0.6637, "lr": 1.4570784829762235e-06, "epoch": 18.034302260830827, "percentage": 90.17, "elapsed_time": "16:20:31", "remaining_time": "1:46:52", "throughput": 3346.96, "total_tokens": 196906672} +{"current_steps": 161935, "total_steps": 179580, "loss": 0.7511, "lr": 1.4562612145052002e-06, "epoch": 18.034859115714443, "percentage": 90.17, "elapsed_time": "16:20:33", "remaining_time": "1:46:50", "throughput": 3346.96, "total_tokens": 196913008} +{"current_steps": 161940, "total_steps": 179580, "loss": 0.7406, "lr": 1.4554441684236558e-06, "epoch": 18.035415970598063, "percentage": 90.18, "elapsed_time": "16:20:35", "remaining_time": "1:46:48", "throughput": 3346.97, "total_tokens": 196919312} +{"current_steps": 161945, "total_steps": 179580, "loss": 0.7588, "lr": 1.4546273447393038e-06, "epoch": 18.03597282548168, "percentage": 90.18, "elapsed_time": "16:20:36", "remaining_time": "1:46:47", "throughput": 3346.98, "total_tokens": 196925840} +{"current_steps": 161950, "total_steps": 179580, "loss": 0.5211, "lr": 1.4538107434598602e-06, "epoch": 18.036529680365298, "percentage": 90.18, "elapsed_time": "16:20:38", "remaining_time": "1:46:45", "throughput": 3346.98, "total_tokens": 196931984} +{"current_steps": 161955, "total_steps": 179580, "loss": 0.6757, "lr": 1.4529943645930355e-06, "epoch": 18.037086535248914, "percentage": 90.19, "elapsed_time": "16:20:40", "remaining_time": "1:46:43", "throughput": 3346.98, "total_tokens": 196938320} +{"current_steps": 161960, "total_steps": 179580, "loss": 0.7338, "lr": 1.4521782081465485e-06, "epoch": 18.03764339013253, "percentage": 90.19, "elapsed_time": "16:20:42", "remaining_time": "1:46:41", "throughput": 3346.99, "total_tokens": 196944400} +{"current_steps": 161965, "total_steps": 179580, "loss": 0.7833, "lr": 1.4513622741281069e-06, "epoch": 18.03820024501615, "percentage": 90.19, "elapsed_time": "16:20:44", "remaining_time": "1:46:39", "throughput": 3346.99, "total_tokens": 196950512} +{"current_steps": 161970, "total_steps": 179580, "loss": 0.4614, "lr": 1.4505465625454128e-06, "epoch": 18.038757099899765, "percentage": 90.19, "elapsed_time": "16:20:45", "remaining_time": "1:46:37", "throughput": 3347.0, "total_tokens": 196957072} +{"current_steps": 161975, "total_steps": 179580, "loss": 0.9098, "lr": 1.4497310734061714e-06, "epoch": 18.039313954783385, "percentage": 90.2, "elapsed_time": "16:20:47", "remaining_time": "1:46:36", "throughput": 3347.0, "total_tokens": 196963088} +{"current_steps": 161980, "total_steps": 179580, "loss": 0.5842, "lr": 1.4489158067180901e-06, "epoch": 18.039870809667, "percentage": 90.2, "elapsed_time": "16:20:49", "remaining_time": "1:46:34", "throughput": 3347.01, "total_tokens": 196968944} +{"current_steps": 161985, "total_steps": 179580, "loss": 0.7728, "lr": 1.4481007624888659e-06, "epoch": 18.040427664550617, "percentage": 90.2, "elapsed_time": "16:20:51", "remaining_time": "1:46:32", "throughput": 3347.01, "total_tokens": 196974960} +{"current_steps": 161990, "total_steps": 179580, "loss": 0.5479, "lr": 1.4472859407262064e-06, "epoch": 18.040984519434236, "percentage": 90.2, "elapsed_time": "16:20:52", "remaining_time": "1:46:30", "throughput": 3347.01, "total_tokens": 196980976} +{"current_steps": 161995, "total_steps": 179580, "loss": 0.6208, "lr": 1.446471341437794e-06, "epoch": 18.041541374317852, "percentage": 90.21, "elapsed_time": "16:20:54", "remaining_time": "1:46:28", "throughput": 3347.01, "total_tokens": 196986864} +{"current_steps": 162000, "total_steps": 179580, "loss": 0.6532, "lr": 1.445656964631334e-06, "epoch": 18.04209822920147, "percentage": 90.21, "elapsed_time": "16:20:56", "remaining_time": "1:46:27", "throughput": 3347.02, "total_tokens": 196993136} +{"current_steps": 162005, "total_steps": 179580, "loss": 0.696, "lr": 1.4448428103145118e-06, "epoch": 18.042655084085087, "percentage": 90.21, "elapsed_time": "16:20:58", "remaining_time": "1:46:25", "throughput": 3347.02, "total_tokens": 196999312} +{"current_steps": 162010, "total_steps": 179580, "loss": 0.7125, "lr": 1.444028878495024e-06, "epoch": 18.043211938968703, "percentage": 90.22, "elapsed_time": "16:20:59", "remaining_time": "1:46:23", "throughput": 3347.02, "total_tokens": 197004880} +{"current_steps": 162015, "total_steps": 179580, "loss": 0.7372, "lr": 1.4432151691805562e-06, "epoch": 18.043768793852323, "percentage": 90.22, "elapsed_time": "16:21:01", "remaining_time": "1:46:21", "throughput": 3347.03, "total_tokens": 197011216} +{"current_steps": 162020, "total_steps": 179580, "loss": 0.8076, "lr": 1.4424016823787966e-06, "epoch": 18.04432564873594, "percentage": 90.22, "elapsed_time": "16:21:03", "remaining_time": "1:46:19", "throughput": 3347.03, "total_tokens": 197017648} +{"current_steps": 162025, "total_steps": 179580, "loss": 0.7689, "lr": 1.4415884180974226e-06, "epoch": 18.044882503619558, "percentage": 90.22, "elapsed_time": "16:21:05", "remaining_time": "1:46:17", "throughput": 3347.04, "total_tokens": 197023792} +{"current_steps": 162030, "total_steps": 179580, "loss": 0.6359, "lr": 1.440775376344125e-06, "epoch": 18.045439358503174, "percentage": 90.23, "elapsed_time": "16:21:06", "remaining_time": "1:46:16", "throughput": 3347.04, "total_tokens": 197029936} +{"current_steps": 162035, "total_steps": 179580, "loss": 0.7158, "lr": 1.4399625571265785e-06, "epoch": 18.04599621338679, "percentage": 90.23, "elapsed_time": "16:21:08", "remaining_time": "1:46:14", "throughput": 3347.04, "total_tokens": 197036048} +{"current_steps": 162040, "total_steps": 179580, "loss": 0.5792, "lr": 1.4391499604524599e-06, "epoch": 18.04655306827041, "percentage": 90.23, "elapsed_time": "16:21:10", "remaining_time": "1:46:12", "throughput": 3347.05, "total_tokens": 197042320} +{"current_steps": 162045, "total_steps": 179580, "loss": 0.8421, "lr": 1.438337586329444e-06, "epoch": 18.047109923154025, "percentage": 90.24, "elapsed_time": "16:21:12", "remaining_time": "1:46:10", "throughput": 3347.05, "total_tokens": 197048496} +{"current_steps": 162050, "total_steps": 179580, "loss": 0.909, "lr": 1.4375254347652133e-06, "epoch": 18.047666778037645, "percentage": 90.24, "elapsed_time": "16:21:13", "remaining_time": "1:46:08", "throughput": 3347.06, "total_tokens": 197054672} +{"current_steps": 162055, "total_steps": 179580, "loss": 0.7715, "lr": 1.4367135057674257e-06, "epoch": 18.04822363292126, "percentage": 90.24, "elapsed_time": "16:21:15", "remaining_time": "1:46:06", "throughput": 3347.06, "total_tokens": 197060720} +{"current_steps": 162060, "total_steps": 179580, "loss": 0.6361, "lr": 1.435901799343764e-06, "epoch": 18.048780487804876, "percentage": 90.24, "elapsed_time": "16:21:17", "remaining_time": "1:46:05", "throughput": 3347.07, "total_tokens": 197066896} +{"current_steps": 162065, "total_steps": 179580, "loss": 0.5427, "lr": 1.4350903155018858e-06, "epoch": 18.049337342688496, "percentage": 90.25, "elapsed_time": "16:21:19", "remaining_time": "1:46:03", "throughput": 3347.07, "total_tokens": 197073200} +{"current_steps": 162070, "total_steps": 179580, "loss": 0.7104, "lr": 1.4342790542494627e-06, "epoch": 18.04989419757211, "percentage": 90.25, "elapsed_time": "16:21:21", "remaining_time": "1:46:01", "throughput": 3347.07, "total_tokens": 197079472} +{"current_steps": 162075, "total_steps": 179580, "loss": 0.7585, "lr": 1.4334680155941526e-06, "epoch": 18.05045105245573, "percentage": 90.25, "elapsed_time": "16:21:22", "remaining_time": "1:45:59", "throughput": 3347.08, "total_tokens": 197084976} +{"current_steps": 162080, "total_steps": 179580, "loss": 0.6783, "lr": 1.4326571995436134e-06, "epoch": 18.051007907339347, "percentage": 90.26, "elapsed_time": "16:21:24", "remaining_time": "1:45:57", "throughput": 3347.08, "total_tokens": 197090992} +{"current_steps": 162085, "total_steps": 179580, "loss": 0.7403, "lr": 1.4318466061055165e-06, "epoch": 18.051564762222966, "percentage": 90.26, "elapsed_time": "16:21:26", "remaining_time": "1:45:56", "throughput": 3347.08, "total_tokens": 197096816} +{"current_steps": 162090, "total_steps": 179580, "loss": 0.8985, "lr": 1.4310362352875084e-06, "epoch": 18.052121617106582, "percentage": 90.26, "elapsed_time": "16:21:28", "remaining_time": "1:45:54", "throughput": 3347.09, "total_tokens": 197103408} +{"current_steps": 162095, "total_steps": 179580, "loss": 0.7501, "lr": 1.4302260870972444e-06, "epoch": 18.0526784719902, "percentage": 90.26, "elapsed_time": "16:21:29", "remaining_time": "1:45:52", "throughput": 3347.09, "total_tokens": 197109328} +{"current_steps": 162100, "total_steps": 179580, "loss": 0.6713, "lr": 1.4294161615423767e-06, "epoch": 18.053235326873818, "percentage": 90.27, "elapsed_time": "16:21:31", "remaining_time": "1:45:50", "throughput": 3347.09, "total_tokens": 197115312} +{"current_steps": 162105, "total_steps": 179580, "loss": 0.8445, "lr": 1.428606458630563e-06, "epoch": 18.053792181757434, "percentage": 90.27, "elapsed_time": "16:21:33", "remaining_time": "1:45:48", "throughput": 3347.1, "total_tokens": 197121168} +{"current_steps": 162110, "total_steps": 179580, "loss": 0.5235, "lr": 1.4277969783694444e-06, "epoch": 18.054349036641053, "percentage": 90.27, "elapsed_time": "16:21:34", "remaining_time": "1:45:46", "throughput": 3347.1, "total_tokens": 197127184} +{"current_steps": 162115, "total_steps": 179580, "loss": 0.7699, "lr": 1.4269877207666705e-06, "epoch": 18.05490589152467, "percentage": 90.27, "elapsed_time": "16:21:36", "remaining_time": "1:45:45", "throughput": 3347.1, "total_tokens": 197133296} +{"current_steps": 162120, "total_steps": 179580, "loss": 0.9375, "lr": 1.4261786858298793e-06, "epoch": 18.055462746408285, "percentage": 90.28, "elapsed_time": "16:21:38", "remaining_time": "1:45:43", "throughput": 3347.11, "total_tokens": 197139728} +{"current_steps": 162125, "total_steps": 179580, "loss": 0.6562, "lr": 1.4253698735667203e-06, "epoch": 18.056019601291904, "percentage": 90.28, "elapsed_time": "16:21:40", "remaining_time": "1:45:41", "throughput": 3347.11, "total_tokens": 197145360} +{"current_steps": 162130, "total_steps": 179580, "loss": 0.7516, "lr": 1.4245612839848293e-06, "epoch": 18.05657645617552, "percentage": 90.28, "elapsed_time": "16:21:41", "remaining_time": "1:45:39", "throughput": 3347.12, "total_tokens": 197151568} +{"current_steps": 162135, "total_steps": 179580, "loss": 0.9312, "lr": 1.4237529170918502e-06, "epoch": 18.05713331105914, "percentage": 90.29, "elapsed_time": "16:21:43", "remaining_time": "1:45:37", "throughput": 3347.12, "total_tokens": 197157840} +{"current_steps": 162140, "total_steps": 179580, "loss": 0.5808, "lr": 1.42294477289541e-06, "epoch": 18.057690165942756, "percentage": 90.29, "elapsed_time": "16:21:45", "remaining_time": "1:45:35", "throughput": 3347.12, "total_tokens": 197163984} +{"current_steps": 162145, "total_steps": 179580, "loss": 0.5571, "lr": 1.4221368514031469e-06, "epoch": 18.05824702082637, "percentage": 90.29, "elapsed_time": "16:21:47", "remaining_time": "1:45:34", "throughput": 3347.13, "total_tokens": 197170064} +{"current_steps": 162150, "total_steps": 179580, "loss": 0.8236, "lr": 1.4213291526226858e-06, "epoch": 18.05880387570999, "percentage": 90.29, "elapsed_time": "16:21:49", "remaining_time": "1:45:32", "throughput": 3347.13, "total_tokens": 197176240} +{"current_steps": 162155, "total_steps": 179580, "loss": 0.8645, "lr": 1.4205216765616702e-06, "epoch": 18.059360730593607, "percentage": 90.3, "elapsed_time": "16:21:50", "remaining_time": "1:45:30", "throughput": 3347.14, "total_tokens": 197182352} +{"current_steps": 162160, "total_steps": 179580, "loss": 0.7677, "lr": 1.4197144232277166e-06, "epoch": 18.059917585477226, "percentage": 90.3, "elapsed_time": "16:21:52", "remaining_time": "1:45:28", "throughput": 3347.14, "total_tokens": 197188080} +{"current_steps": 162165, "total_steps": 179580, "loss": 1.0298, "lr": 1.4189073926284519e-06, "epoch": 18.060474440360842, "percentage": 90.3, "elapsed_time": "16:21:54", "remaining_time": "1:45:26", "throughput": 3347.14, "total_tokens": 197194256} +{"current_steps": 162170, "total_steps": 179580, "loss": 0.7843, "lr": 1.418100584771495e-06, "epoch": 18.061031295244458, "percentage": 90.31, "elapsed_time": "16:21:55", "remaining_time": "1:45:25", "throughput": 3347.14, "total_tokens": 197200176} +{"current_steps": 162175, "total_steps": 179580, "loss": 0.7035, "lr": 1.417293999664479e-06, "epoch": 18.061588150128078, "percentage": 90.31, "elapsed_time": "16:21:57", "remaining_time": "1:45:23", "throughput": 3347.15, "total_tokens": 197206416} +{"current_steps": 162180, "total_steps": 179580, "loss": 0.7266, "lr": 1.4164876373150116e-06, "epoch": 18.062145005011693, "percentage": 90.31, "elapsed_time": "16:21:59", "remaining_time": "1:45:21", "throughput": 3347.15, "total_tokens": 197212496} +{"current_steps": 162185, "total_steps": 179580, "loss": 0.6162, "lr": 1.4156814977307143e-06, "epoch": 18.062701859895313, "percentage": 90.31, "elapsed_time": "16:22:01", "remaining_time": "1:45:19", "throughput": 3347.15, "total_tokens": 197218736} +{"current_steps": 162190, "total_steps": 179580, "loss": 0.688, "lr": 1.4148755809191978e-06, "epoch": 18.06325871477893, "percentage": 90.32, "elapsed_time": "16:22:03", "remaining_time": "1:45:17", "throughput": 3347.16, "total_tokens": 197224688} +{"current_steps": 162195, "total_steps": 179580, "loss": 0.6804, "lr": 1.4140698868880808e-06, "epoch": 18.063815569662545, "percentage": 90.32, "elapsed_time": "16:22:04", "remaining_time": "1:45:15", "throughput": 3347.16, "total_tokens": 197230320} +{"current_steps": 162200, "total_steps": 179580, "loss": 0.6208, "lr": 1.4132644156449687e-06, "epoch": 18.064372424546164, "percentage": 90.32, "elapsed_time": "16:22:06", "remaining_time": "1:45:14", "throughput": 3347.16, "total_tokens": 197236304} +{"current_steps": 162205, "total_steps": 179580, "loss": 0.7746, "lr": 1.4124591671974718e-06, "epoch": 18.06492927942978, "percentage": 90.32, "elapsed_time": "16:22:08", "remaining_time": "1:45:12", "throughput": 3347.16, "total_tokens": 197242352} +{"current_steps": 162210, "total_steps": 179580, "loss": 0.4881, "lr": 1.411654141553198e-06, "epoch": 18.0654861343134, "percentage": 90.33, "elapsed_time": "16:22:09", "remaining_time": "1:45:10", "throughput": 3347.17, "total_tokens": 197248336} +{"current_steps": 162215, "total_steps": 179580, "loss": 0.8341, "lr": 1.4108493387197497e-06, "epoch": 18.066042989197015, "percentage": 90.33, "elapsed_time": "16:22:11", "remaining_time": "1:45:08", "throughput": 3347.17, "total_tokens": 197254640} +{"current_steps": 162220, "total_steps": 179580, "loss": 0.7173, "lr": 1.4100447587047261e-06, "epoch": 18.06659984408063, "percentage": 90.33, "elapsed_time": "16:22:13", "remaining_time": "1:45:06", "throughput": 3347.17, "total_tokens": 197260848} +{"current_steps": 162225, "total_steps": 179580, "loss": 0.7657, "lr": 1.4092404015157295e-06, "epoch": 18.06715669896425, "percentage": 90.34, "elapsed_time": "16:22:15", "remaining_time": "1:45:04", "throughput": 3347.18, "total_tokens": 197267120} +{"current_steps": 162230, "total_steps": 179580, "loss": 0.5822, "lr": 1.4084362671603623e-06, "epoch": 18.067713553847867, "percentage": 90.34, "elapsed_time": "16:22:17", "remaining_time": "1:45:03", "throughput": 3347.18, "total_tokens": 197273296} +{"current_steps": 162235, "total_steps": 179580, "loss": 0.6302, "lr": 1.407632355646213e-06, "epoch": 18.068270408731486, "percentage": 90.34, "elapsed_time": "16:22:18", "remaining_time": "1:45:01", "throughput": 3347.19, "total_tokens": 197279408} +{"current_steps": 162240, "total_steps": 179580, "loss": 0.7669, "lr": 1.406828666980875e-06, "epoch": 18.068827263615102, "percentage": 90.34, "elapsed_time": "16:22:20", "remaining_time": "1:44:59", "throughput": 3347.19, "total_tokens": 197285680} +{"current_steps": 162245, "total_steps": 179580, "loss": 0.64, "lr": 1.4060252011719456e-06, "epoch": 18.069384118498718, "percentage": 90.35, "elapsed_time": "16:22:22", "remaining_time": "1:44:57", "throughput": 3347.19, "total_tokens": 197291568} +{"current_steps": 162250, "total_steps": 179580, "loss": 0.9231, "lr": 1.4052219582270098e-06, "epoch": 18.069940973382337, "percentage": 90.35, "elapsed_time": "16:22:24", "remaining_time": "1:44:55", "throughput": 3347.19, "total_tokens": 197297584} +{"current_steps": 162255, "total_steps": 179580, "loss": 0.8513, "lr": 1.404418938153662e-06, "epoch": 18.070497828265953, "percentage": 90.35, "elapsed_time": "16:22:26", "remaining_time": "1:44:54", "throughput": 3347.2, "total_tokens": 197304048} +{"current_steps": 162260, "total_steps": 179580, "loss": 0.6164, "lr": 1.4036161409594767e-06, "epoch": 18.071054683149573, "percentage": 90.36, "elapsed_time": "16:22:27", "remaining_time": "1:44:52", "throughput": 3347.2, "total_tokens": 197309552} +{"current_steps": 162265, "total_steps": 179580, "loss": 0.7874, "lr": 1.402813566652042e-06, "epoch": 18.07161153803319, "percentage": 90.36, "elapsed_time": "16:22:29", "remaining_time": "1:44:50", "throughput": 3347.21, "total_tokens": 197315824} +{"current_steps": 162270, "total_steps": 179580, "loss": 0.7374, "lr": 1.402011215238938e-06, "epoch": 18.072168392916804, "percentage": 90.36, "elapsed_time": "16:22:31", "remaining_time": "1:44:48", "throughput": 3347.21, "total_tokens": 197322384} +{"current_steps": 162275, "total_steps": 179580, "loss": 0.883, "lr": 1.4012090867277478e-06, "epoch": 18.072725247800424, "percentage": 90.36, "elapsed_time": "16:22:33", "remaining_time": "1:44:46", "throughput": 3347.22, "total_tokens": 197328496} +{"current_steps": 162280, "total_steps": 179580, "loss": 1.1094, "lr": 1.4004071811260456e-06, "epoch": 18.07328210268404, "percentage": 90.37, "elapsed_time": "16:22:34", "remaining_time": "1:44:44", "throughput": 3347.22, "total_tokens": 197334192} +{"current_steps": 162285, "total_steps": 179580, "loss": 0.6537, "lr": 1.399605498441403e-06, "epoch": 18.07383895756766, "percentage": 90.37, "elapsed_time": "16:22:36", "remaining_time": "1:44:43", "throughput": 3347.22, "total_tokens": 197340400} +{"current_steps": 162290, "total_steps": 179580, "loss": 0.6819, "lr": 1.3988040386813921e-06, "epoch": 18.074395812451275, "percentage": 90.37, "elapsed_time": "16:22:38", "remaining_time": "1:44:41", "throughput": 3347.23, "total_tokens": 197346640} +{"current_steps": 162295, "total_steps": 179580, "loss": 0.6254, "lr": 1.3980028018535901e-06, "epoch": 18.07495266733489, "percentage": 90.37, "elapsed_time": "16:22:40", "remaining_time": "1:44:39", "throughput": 3347.23, "total_tokens": 197353136} +{"current_steps": 162300, "total_steps": 179580, "loss": 0.4965, "lr": 1.3972017879655601e-06, "epoch": 18.07550952221851, "percentage": 90.38, "elapsed_time": "16:22:41", "remaining_time": "1:44:37", "throughput": 3347.23, "total_tokens": 197359184} +{"current_steps": 162305, "total_steps": 179580, "loss": 0.8572, "lr": 1.3964009970248714e-06, "epoch": 18.076066377102126, "percentage": 90.38, "elapsed_time": "16:22:43", "remaining_time": "1:44:35", "throughput": 3347.24, "total_tokens": 197365072} +{"current_steps": 162310, "total_steps": 179580, "loss": 0.6275, "lr": 1.3956004290390817e-06, "epoch": 18.076623231985746, "percentage": 90.38, "elapsed_time": "16:22:45", "remaining_time": "1:44:33", "throughput": 3347.24, "total_tokens": 197371216} +{"current_steps": 162315, "total_steps": 179580, "loss": 0.9712, "lr": 1.39480008401576e-06, "epoch": 18.07718008686936, "percentage": 90.39, "elapsed_time": "16:22:47", "remaining_time": "1:44:32", "throughput": 3347.25, "total_tokens": 197377648} +{"current_steps": 162320, "total_steps": 179580, "loss": 0.6653, "lr": 1.3939999619624612e-06, "epoch": 18.077736941752978, "percentage": 90.39, "elapsed_time": "16:22:48", "remaining_time": "1:44:30", "throughput": 3347.25, "total_tokens": 197383728} +{"current_steps": 162325, "total_steps": 179580, "loss": 0.6462, "lr": 1.3932000628867515e-06, "epoch": 18.078293796636597, "percentage": 90.39, "elapsed_time": "16:22:50", "remaining_time": "1:44:28", "throughput": 3347.25, "total_tokens": 197389744} +{"current_steps": 162330, "total_steps": 179580, "loss": 0.7509, "lr": 1.3924003867961749e-06, "epoch": 18.078850651520213, "percentage": 90.39, "elapsed_time": "16:22:52", "remaining_time": "1:44:26", "throughput": 3347.25, "total_tokens": 197395888} +{"current_steps": 162335, "total_steps": 179580, "loss": 0.4814, "lr": 1.3916009336982949e-06, "epoch": 18.079407506403832, "percentage": 90.4, "elapsed_time": "16:22:54", "remaining_time": "1:44:24", "throughput": 3347.25, "total_tokens": 197402032} +{"current_steps": 162340, "total_steps": 179580, "loss": 0.828, "lr": 1.3908017036006527e-06, "epoch": 18.07996436128745, "percentage": 90.4, "elapsed_time": "16:22:56", "remaining_time": "1:44:23", "throughput": 3347.26, "total_tokens": 197408176} +{"current_steps": 162345, "total_steps": 179580, "loss": 0.8723, "lr": 1.3900026965108088e-06, "epoch": 18.080521216171064, "percentage": 90.4, "elapsed_time": "16:22:57", "remaining_time": "1:44:21", "throughput": 3347.26, "total_tokens": 197414288} +{"current_steps": 162350, "total_steps": 179580, "loss": 0.5954, "lr": 1.389203912436307e-06, "epoch": 18.081078071054684, "percentage": 90.41, "elapsed_time": "16:22:59", "remaining_time": "1:44:19", "throughput": 3347.26, "total_tokens": 197420656} +{"current_steps": 162355, "total_steps": 179580, "loss": 0.5514, "lr": 1.388405351384689e-06, "epoch": 18.0816349259383, "percentage": 90.41, "elapsed_time": "16:23:01", "remaining_time": "1:44:17", "throughput": 3347.27, "total_tokens": 197426832} +{"current_steps": 162360, "total_steps": 179580, "loss": 0.761, "lr": 1.3876070133634955e-06, "epoch": 18.08219178082192, "percentage": 90.41, "elapsed_time": "16:23:03", "remaining_time": "1:44:15", "throughput": 3347.27, "total_tokens": 197433456} +{"current_steps": 162365, "total_steps": 179580, "loss": 0.7012, "lr": 1.3868088983802791e-06, "epoch": 18.082748635705535, "percentage": 90.41, "elapsed_time": "16:23:05", "remaining_time": "1:44:13", "throughput": 3347.28, "total_tokens": 197439504} +{"current_steps": 162370, "total_steps": 179580, "loss": 0.8376, "lr": 1.386011006442567e-06, "epoch": 18.08330549058915, "percentage": 90.42, "elapsed_time": "16:23:06", "remaining_time": "1:44:12", "throughput": 3347.28, "total_tokens": 197445872} +{"current_steps": 162375, "total_steps": 179580, "loss": 0.6558, "lr": 1.385213337557903e-06, "epoch": 18.08386234547277, "percentage": 90.42, "elapsed_time": "16:23:08", "remaining_time": "1:44:10", "throughput": 3347.29, "total_tokens": 197452176} +{"current_steps": 162380, "total_steps": 179580, "loss": 0.7093, "lr": 1.3844158917338117e-06, "epoch": 18.084419200356386, "percentage": 90.42, "elapsed_time": "16:23:10", "remaining_time": "1:44:08", "throughput": 3347.29, "total_tokens": 197458384} +{"current_steps": 162385, "total_steps": 179580, "loss": 0.5742, "lr": 1.3836186689778402e-06, "epoch": 18.084976055240006, "percentage": 90.42, "elapsed_time": "16:23:12", "remaining_time": "1:44:06", "throughput": 3347.3, "total_tokens": 197464784} +{"current_steps": 162390, "total_steps": 179580, "loss": 0.6723, "lr": 1.382821669297507e-06, "epoch": 18.08553291012362, "percentage": 90.43, "elapsed_time": "16:23:14", "remaining_time": "1:44:04", "throughput": 3347.3, "total_tokens": 197470864} +{"current_steps": 162395, "total_steps": 179580, "loss": 0.7748, "lr": 1.382024892700351e-06, "epoch": 18.086089765007237, "percentage": 90.43, "elapsed_time": "16:23:15", "remaining_time": "1:44:03", "throughput": 3347.3, "total_tokens": 197476784} +{"current_steps": 162400, "total_steps": 179580, "loss": 0.7307, "lr": 1.3812283391938852e-06, "epoch": 18.086646619890857, "percentage": 90.43, "elapsed_time": "16:23:17", "remaining_time": "1:44:01", "throughput": 3347.31, "total_tokens": 197482832} +{"current_steps": 162405, "total_steps": 179580, "loss": 0.5297, "lr": 1.3804320087856453e-06, "epoch": 18.087203474774473, "percentage": 90.44, "elapsed_time": "16:23:19", "remaining_time": "1:43:59", "throughput": 3347.31, "total_tokens": 197488752} +{"current_steps": 162410, "total_steps": 179580, "loss": 0.7472, "lr": 1.379635901483145e-06, "epoch": 18.087760329658092, "percentage": 90.44, "elapsed_time": "16:23:21", "remaining_time": "1:43:57", "throughput": 3347.3, "total_tokens": 197495088} +{"current_steps": 162415, "total_steps": 179580, "loss": 0.622, "lr": 1.3788400172939086e-06, "epoch": 18.088317184541708, "percentage": 90.44, "elapsed_time": "16:23:23", "remaining_time": "1:43:55", "throughput": 3347.31, "total_tokens": 197501488} +{"current_steps": 162420, "total_steps": 179580, "loss": 0.6551, "lr": 1.378044356225458e-06, "epoch": 18.088874039425324, "percentage": 90.44, "elapsed_time": "16:23:24", "remaining_time": "1:43:53", "throughput": 3347.31, "total_tokens": 197507824} +{"current_steps": 162425, "total_steps": 179580, "loss": 0.9884, "lr": 1.377248918285301e-06, "epoch": 18.089430894308943, "percentage": 90.45, "elapsed_time": "16:23:26", "remaining_time": "1:43:52", "throughput": 3347.31, "total_tokens": 197513808} +{"current_steps": 162430, "total_steps": 179580, "loss": 0.5184, "lr": 1.376453703480951e-06, "epoch": 18.08998774919256, "percentage": 90.45, "elapsed_time": "16:23:28", "remaining_time": "1:43:50", "throughput": 3347.32, "total_tokens": 197519504} +{"current_steps": 162435, "total_steps": 179580, "loss": 0.7648, "lr": 1.3756587118199271e-06, "epoch": 18.09054460407618, "percentage": 90.45, "elapsed_time": "16:23:30", "remaining_time": "1:43:48", "throughput": 3347.32, "total_tokens": 197525584} +{"current_steps": 162440, "total_steps": 179580, "loss": 0.4707, "lr": 1.3748639433097342e-06, "epoch": 18.091101458959795, "percentage": 90.46, "elapsed_time": "16:23:31", "remaining_time": "1:43:46", "throughput": 3347.32, "total_tokens": 197531536} +{"current_steps": 162445, "total_steps": 179580, "loss": 0.7315, "lr": 1.3740693979578777e-06, "epoch": 18.091658313843414, "percentage": 90.46, "elapsed_time": "16:23:33", "remaining_time": "1:43:44", "throughput": 3347.33, "total_tokens": 197537840} +{"current_steps": 162450, "total_steps": 179580, "loss": 0.5533, "lr": 1.3732750757718627e-06, "epoch": 18.09221516872703, "percentage": 90.46, "elapsed_time": "16:23:35", "remaining_time": "1:43:43", "throughput": 3347.33, "total_tokens": 197543920} +{"current_steps": 162455, "total_steps": 179580, "loss": 0.7735, "lr": 1.3724809767591967e-06, "epoch": 18.092772023610646, "percentage": 90.46, "elapsed_time": "16:23:37", "remaining_time": "1:43:41", "throughput": 3347.33, "total_tokens": 197549648} +{"current_steps": 162460, "total_steps": 179580, "loss": 0.8899, "lr": 1.3716871009273742e-06, "epoch": 18.093328878494265, "percentage": 90.47, "elapsed_time": "16:23:38", "remaining_time": "1:43:39", "throughput": 3347.34, "total_tokens": 197555920} +{"current_steps": 162465, "total_steps": 179580, "loss": 0.5861, "lr": 1.3708934482839026e-06, "epoch": 18.09388573337788, "percentage": 90.47, "elapsed_time": "16:23:40", "remaining_time": "1:43:37", "throughput": 3347.34, "total_tokens": 197562352} +{"current_steps": 162470, "total_steps": 179580, "loss": 0.5553, "lr": 1.3701000188362734e-06, "epoch": 18.0944425882615, "percentage": 90.47, "elapsed_time": "16:23:42", "remaining_time": "1:43:35", "throughput": 3347.34, "total_tokens": 197568304} +{"current_steps": 162475, "total_steps": 179580, "loss": 0.716, "lr": 1.3693068125919806e-06, "epoch": 18.094999443145117, "percentage": 90.47, "elapsed_time": "16:23:44", "remaining_time": "1:43:33", "throughput": 3347.35, "total_tokens": 197574288} +{"current_steps": 162480, "total_steps": 179580, "loss": 0.772, "lr": 1.3685138295585153e-06, "epoch": 18.095556298028733, "percentage": 90.48, "elapsed_time": "16:23:45", "remaining_time": "1:43:32", "throughput": 3347.35, "total_tokens": 197580592} +{"current_steps": 162485, "total_steps": 179580, "loss": 0.7637, "lr": 1.3677210697433717e-06, "epoch": 18.096113152912352, "percentage": 90.48, "elapsed_time": "16:23:47", "remaining_time": "1:43:30", "throughput": 3347.35, "total_tokens": 197586736} +{"current_steps": 162490, "total_steps": 179580, "loss": 0.6935, "lr": 1.3669285331540383e-06, "epoch": 18.096670007795968, "percentage": 90.48, "elapsed_time": "16:23:49", "remaining_time": "1:43:28", "throughput": 3347.36, "total_tokens": 197592912} +{"current_steps": 162495, "total_steps": 179580, "loss": 0.9529, "lr": 1.3661362197979977e-06, "epoch": 18.097226862679587, "percentage": 90.49, "elapsed_time": "16:23:51", "remaining_time": "1:43:26", "throughput": 3347.36, "total_tokens": 197599152} +{"current_steps": 162500, "total_steps": 179580, "loss": 0.4779, "lr": 1.3653441296827386e-06, "epoch": 18.097783717563203, "percentage": 90.49, "elapsed_time": "16:23:53", "remaining_time": "1:43:24", "throughput": 3347.36, "total_tokens": 197605072} +{"current_steps": 162505, "total_steps": 179580, "loss": 0.718, "lr": 1.3645522628157326e-06, "epoch": 18.09834057244682, "percentage": 90.49, "elapsed_time": "16:23:54", "remaining_time": "1:43:23", "throughput": 3347.37, "total_tokens": 197611120} +{"current_steps": 162510, "total_steps": 179580, "loss": 0.7582, "lr": 1.363760619204474e-06, "epoch": 18.09889742733044, "percentage": 90.49, "elapsed_time": "16:23:56", "remaining_time": "1:43:21", "throughput": 3347.37, "total_tokens": 197617328} +{"current_steps": 162515, "total_steps": 179580, "loss": 0.7094, "lr": 1.3629691988564314e-06, "epoch": 18.099454282214055, "percentage": 90.5, "elapsed_time": "16:23:58", "remaining_time": "1:43:19", "throughput": 3347.38, "total_tokens": 197623664} +{"current_steps": 162520, "total_steps": 179580, "loss": 0.7053, "lr": 1.3621780017790825e-06, "epoch": 18.100011137097674, "percentage": 90.5, "elapsed_time": "16:23:59", "remaining_time": "1:43:17", "throughput": 3347.38, "total_tokens": 197629232} +{"current_steps": 162525, "total_steps": 179580, "loss": 0.6202, "lr": 1.3613870279798963e-06, "epoch": 18.10056799198129, "percentage": 90.5, "elapsed_time": "16:24:01", "remaining_time": "1:43:15", "throughput": 3347.38, "total_tokens": 197635248} +{"current_steps": 162530, "total_steps": 179580, "loss": 0.7282, "lr": 1.3605962774663527e-06, "epoch": 18.101124846864906, "percentage": 90.51, "elapsed_time": "16:24:03", "remaining_time": "1:43:13", "throughput": 3347.38, "total_tokens": 197640912} +{"current_steps": 162535, "total_steps": 179580, "loss": 0.8833, "lr": 1.3598057502459155e-06, "epoch": 18.101681701748525, "percentage": 90.51, "elapsed_time": "16:24:05", "remaining_time": "1:43:12", "throughput": 3347.39, "total_tokens": 197647248} +{"current_steps": 162540, "total_steps": 179580, "loss": 0.7422, "lr": 1.3590154463260562e-06, "epoch": 18.10223855663214, "percentage": 90.51, "elapsed_time": "16:24:06", "remaining_time": "1:43:10", "throughput": 3347.39, "total_tokens": 197653360} +{"current_steps": 162545, "total_steps": 179580, "loss": 0.4187, "lr": 1.358225365714233e-06, "epoch": 18.10279541151576, "percentage": 90.51, "elapsed_time": "16:24:08", "remaining_time": "1:43:08", "throughput": 3347.4, "total_tokens": 197659696} +{"current_steps": 162550, "total_steps": 179580, "loss": 0.7394, "lr": 1.3574355084179146e-06, "epoch": 18.103352266399376, "percentage": 90.52, "elapsed_time": "16:24:10", "remaining_time": "1:43:06", "throughput": 3347.4, "total_tokens": 197666000} +{"current_steps": 162555, "total_steps": 179580, "loss": 1.0239, "lr": 1.3566458744445566e-06, "epoch": 18.103909121282992, "percentage": 90.52, "elapsed_time": "16:24:12", "remaining_time": "1:43:04", "throughput": 3347.41, "total_tokens": 197671440} +{"current_steps": 162560, "total_steps": 179580, "loss": 0.6492, "lr": 1.3558564638016275e-06, "epoch": 18.104465976166612, "percentage": 90.52, "elapsed_time": "16:24:13", "remaining_time": "1:43:02", "throughput": 3347.41, "total_tokens": 197677360} +{"current_steps": 162565, "total_steps": 179580, "loss": 0.799, "lr": 1.3550672764965744e-06, "epoch": 18.105022831050228, "percentage": 90.53, "elapsed_time": "16:24:15", "remaining_time": "1:43:01", "throughput": 3347.41, "total_tokens": 197683920} +{"current_steps": 162570, "total_steps": 179580, "loss": 0.6648, "lr": 1.3542783125368552e-06, "epoch": 18.105579685933847, "percentage": 90.53, "elapsed_time": "16:24:17", "remaining_time": "1:42:59", "throughput": 3347.42, "total_tokens": 197690032} +{"current_steps": 162575, "total_steps": 179580, "loss": 0.585, "lr": 1.3534895719299196e-06, "epoch": 18.106136540817463, "percentage": 90.53, "elapsed_time": "16:24:19", "remaining_time": "1:42:57", "throughput": 3347.42, "total_tokens": 197696400} +{"current_steps": 162580, "total_steps": 179580, "loss": 0.643, "lr": 1.3527010546832225e-06, "epoch": 18.10669339570108, "percentage": 90.53, "elapsed_time": "16:24:21", "remaining_time": "1:42:55", "throughput": 3347.42, "total_tokens": 197702448} +{"current_steps": 162585, "total_steps": 179580, "loss": 0.5591, "lr": 1.351912760804208e-06, "epoch": 18.1072502505847, "percentage": 90.54, "elapsed_time": "16:24:22", "remaining_time": "1:42:53", "throughput": 3347.42, "total_tokens": 197708080} +{"current_steps": 162590, "total_steps": 179580, "loss": 0.7411, "lr": 1.351124690300329e-06, "epoch": 18.107807105468314, "percentage": 90.54, "elapsed_time": "16:24:24", "remaining_time": "1:42:52", "throughput": 3347.43, "total_tokens": 197714160} +{"current_steps": 162595, "total_steps": 179580, "loss": 0.6546, "lr": 1.3503368431790176e-06, "epoch": 18.108363960351934, "percentage": 90.54, "elapsed_time": "16:24:26", "remaining_time": "1:42:50", "throughput": 3347.43, "total_tokens": 197720560} +{"current_steps": 162600, "total_steps": 179580, "loss": 0.6951, "lr": 1.3495492194477267e-06, "epoch": 18.10892081523555, "percentage": 90.54, "elapsed_time": "16:24:28", "remaining_time": "1:42:48", "throughput": 3347.44, "total_tokens": 197726864} +{"current_steps": 162605, "total_steps": 179580, "loss": 0.8632, "lr": 1.3487618191138861e-06, "epoch": 18.109477670119166, "percentage": 90.55, "elapsed_time": "16:24:29", "remaining_time": "1:42:46", "throughput": 3347.44, "total_tokens": 197732880} +{"current_steps": 162610, "total_steps": 179580, "loss": 0.8181, "lr": 1.347974642184946e-06, "epoch": 18.110034525002785, "percentage": 90.55, "elapsed_time": "16:24:31", "remaining_time": "1:42:44", "throughput": 3347.44, "total_tokens": 197739024} +{"current_steps": 162615, "total_steps": 179580, "loss": 0.7242, "lr": 1.3471876886683331e-06, "epoch": 18.1105913798864, "percentage": 90.55, "elapsed_time": "16:24:33", "remaining_time": "1:42:42", "throughput": 3347.45, "total_tokens": 197744880} +{"current_steps": 162620, "total_steps": 179580, "loss": 0.7829, "lr": 1.3464009585714838e-06, "epoch": 18.11114823477002, "percentage": 90.56, "elapsed_time": "16:24:35", "remaining_time": "1:42:41", "throughput": 3347.45, "total_tokens": 197751280} +{"current_steps": 162625, "total_steps": 179580, "loss": 0.5828, "lr": 1.3456144519018249e-06, "epoch": 18.111705089653636, "percentage": 90.56, "elapsed_time": "16:24:37", "remaining_time": "1:42:39", "throughput": 3347.45, "total_tokens": 197757744} +{"current_steps": 162630, "total_steps": 179580, "loss": 0.5465, "lr": 1.3448281686667923e-06, "epoch": 18.112261944537252, "percentage": 90.56, "elapsed_time": "16:24:38", "remaining_time": "1:42:37", "throughput": 3347.46, "total_tokens": 197764080} +{"current_steps": 162635, "total_steps": 179580, "loss": 0.7609, "lr": 1.3440421088738109e-06, "epoch": 18.11281879942087, "percentage": 90.56, "elapsed_time": "16:24:40", "remaining_time": "1:42:35", "throughput": 3347.46, "total_tokens": 197769840} +{"current_steps": 162640, "total_steps": 179580, "loss": 0.8048, "lr": 1.343256272530305e-06, "epoch": 18.113375654304487, "percentage": 90.57, "elapsed_time": "16:24:42", "remaining_time": "1:42:33", "throughput": 3347.47, "total_tokens": 197775952} +{"current_steps": 162645, "total_steps": 179580, "loss": 0.7654, "lr": 1.3424706596436909e-06, "epoch": 18.113932509188107, "percentage": 90.57, "elapsed_time": "16:24:44", "remaining_time": "1:42:31", "throughput": 3347.47, "total_tokens": 197782256} +{"current_steps": 162650, "total_steps": 179580, "loss": 0.5542, "lr": 1.3416852702213989e-06, "epoch": 18.114489364071723, "percentage": 90.57, "elapsed_time": "16:24:45", "remaining_time": "1:42:30", "throughput": 3347.47, "total_tokens": 197787568} +{"current_steps": 162655, "total_steps": 179580, "loss": 0.7258, "lr": 1.3409001042708425e-06, "epoch": 18.11504621895534, "percentage": 90.58, "elapsed_time": "16:24:47", "remaining_time": "1:42:28", "throughput": 3347.48, "total_tokens": 197793744} +{"current_steps": 162660, "total_steps": 179580, "loss": 0.7134, "lr": 1.340115161799449e-06, "epoch": 18.115603073838958, "percentage": 90.58, "elapsed_time": "16:24:49", "remaining_time": "1:42:26", "throughput": 3347.48, "total_tokens": 197799280} +{"current_steps": 162665, "total_steps": 179580, "loss": 0.6456, "lr": 1.3393304428146125e-06, "epoch": 18.116159928722574, "percentage": 90.58, "elapsed_time": "16:24:50", "remaining_time": "1:42:24", "throughput": 3347.48, "total_tokens": 197804560} +{"current_steps": 162670, "total_steps": 179580, "loss": 0.7666, "lr": 1.3385459473237632e-06, "epoch": 18.116716783606194, "percentage": 90.58, "elapsed_time": "16:24:52", "remaining_time": "1:42:22", "throughput": 3347.48, "total_tokens": 197810480} +{"current_steps": 162675, "total_steps": 179580, "loss": 0.5077, "lr": 1.337761675334301e-06, "epoch": 18.11727363848981, "percentage": 90.59, "elapsed_time": "16:24:54", "remaining_time": "1:42:20", "throughput": 3347.49, "total_tokens": 197816624} +{"current_steps": 162680, "total_steps": 179580, "loss": 0.6894, "lr": 1.3369776268536388e-06, "epoch": 18.117830493373425, "percentage": 90.59, "elapsed_time": "16:24:55", "remaining_time": "1:42:19", "throughput": 3347.49, "total_tokens": 197822672} +{"current_steps": 162685, "total_steps": 179580, "loss": 0.524, "lr": 1.3361938018891822e-06, "epoch": 18.118387348257045, "percentage": 90.59, "elapsed_time": "16:24:57", "remaining_time": "1:42:17", "throughput": 3347.49, "total_tokens": 197828592} +{"current_steps": 162690, "total_steps": 179580, "loss": 0.5653, "lr": 1.3354102004483366e-06, "epoch": 18.11894420314066, "percentage": 90.59, "elapsed_time": "16:24:59", "remaining_time": "1:42:15", "throughput": 3347.5, "total_tokens": 197834704} +{"current_steps": 162695, "total_steps": 179580, "loss": 0.7172, "lr": 1.3346268225384957e-06, "epoch": 18.11950105802428, "percentage": 90.6, "elapsed_time": "16:25:01", "remaining_time": "1:42:13", "throughput": 3347.5, "total_tokens": 197840656} +{"current_steps": 162700, "total_steps": 179580, "loss": 0.5454, "lr": 1.3338436681670674e-06, "epoch": 18.120057912907896, "percentage": 90.6, "elapsed_time": "16:25:02", "remaining_time": "1:42:11", "throughput": 3347.5, "total_tokens": 197846896} +{"current_steps": 162705, "total_steps": 179580, "loss": 0.6139, "lr": 1.333060737341449e-06, "epoch": 18.120614767791512, "percentage": 90.6, "elapsed_time": "16:25:04", "remaining_time": "1:42:10", "throughput": 3347.51, "total_tokens": 197852752} +{"current_steps": 162710, "total_steps": 179580, "loss": 0.6351, "lr": 1.3322780300690313e-06, "epoch": 18.12117162267513, "percentage": 90.61, "elapsed_time": "16:25:06", "remaining_time": "1:42:08", "throughput": 3347.51, "total_tokens": 197858672} +{"current_steps": 162715, "total_steps": 179580, "loss": 0.6451, "lr": 1.3314955463572088e-06, "epoch": 18.121728477558747, "percentage": 90.61, "elapsed_time": "16:25:08", "remaining_time": "1:42:06", "throughput": 3347.51, "total_tokens": 197864944} +{"current_steps": 162720, "total_steps": 179580, "loss": 0.7836, "lr": 1.3307132862133754e-06, "epoch": 18.122285332442367, "percentage": 90.61, "elapsed_time": "16:25:09", "remaining_time": "1:42:04", "throughput": 3347.52, "total_tokens": 197871408} +{"current_steps": 162725, "total_steps": 179580, "loss": 0.6767, "lr": 1.3299312496449168e-06, "epoch": 18.122842187325983, "percentage": 90.61, "elapsed_time": "16:25:11", "remaining_time": "1:42:02", "throughput": 3347.52, "total_tokens": 197877616} +{"current_steps": 162730, "total_steps": 179580, "loss": 0.7511, "lr": 1.3291494366592272e-06, "epoch": 18.1233990422096, "percentage": 90.62, "elapsed_time": "16:25:13", "remaining_time": "1:42:00", "throughput": 3347.52, "total_tokens": 197883696} +{"current_steps": 162735, "total_steps": 179580, "loss": 0.8163, "lr": 1.3283678472636784e-06, "epoch": 18.123955897093218, "percentage": 90.62, "elapsed_time": "16:25:15", "remaining_time": "1:41:59", "throughput": 3347.53, "total_tokens": 197890256} +{"current_steps": 162740, "total_steps": 179580, "loss": 0.4764, "lr": 1.3275864814656674e-06, "epoch": 18.124512751976834, "percentage": 90.62, "elapsed_time": "16:25:17", "remaining_time": "1:41:57", "throughput": 3347.53, "total_tokens": 197896112} +{"current_steps": 162745, "total_steps": 179580, "loss": 0.5959, "lr": 1.3268053392725605e-06, "epoch": 18.125069606860453, "percentage": 90.63, "elapsed_time": "16:25:18", "remaining_time": "1:41:55", "throughput": 3347.54, "total_tokens": 197902320} +{"current_steps": 162750, "total_steps": 179580, "loss": 0.5744, "lr": 1.3260244206917489e-06, "epoch": 18.12562646174407, "percentage": 90.63, "elapsed_time": "16:25:20", "remaining_time": "1:41:53", "throughput": 3347.54, "total_tokens": 197908816} +{"current_steps": 162755, "total_steps": 179580, "loss": 0.7906, "lr": 1.3252437257306044e-06, "epoch": 18.126183316627685, "percentage": 90.63, "elapsed_time": "16:25:22", "remaining_time": "1:41:51", "throughput": 3347.55, "total_tokens": 197915088} +{"current_steps": 162760, "total_steps": 179580, "loss": 0.5644, "lr": 1.324463254396502e-06, "epoch": 18.126740171511305, "percentage": 90.63, "elapsed_time": "16:25:24", "remaining_time": "1:41:50", "throughput": 3347.55, "total_tokens": 197921200} +{"current_steps": 162765, "total_steps": 179580, "loss": 0.6262, "lr": 1.3236830066968075e-06, "epoch": 18.12729702639492, "percentage": 90.64, "elapsed_time": "16:25:25", "remaining_time": "1:41:48", "throughput": 3347.55, "total_tokens": 197927248} +{"current_steps": 162770, "total_steps": 179580, "loss": 0.6956, "lr": 1.3229029826388988e-06, "epoch": 18.12785388127854, "percentage": 90.64, "elapsed_time": "16:25:27", "remaining_time": "1:41:46", "throughput": 3347.56, "total_tokens": 197933584} +{"current_steps": 162775, "total_steps": 179580, "loss": 0.6065, "lr": 1.322123182230145e-06, "epoch": 18.128410736162156, "percentage": 90.64, "elapsed_time": "16:25:29", "remaining_time": "1:41:44", "throughput": 3347.56, "total_tokens": 197939728} +{"current_steps": 162780, "total_steps": 179580, "loss": 0.7616, "lr": 1.3213436054779039e-06, "epoch": 18.12896759104577, "percentage": 90.64, "elapsed_time": "16:25:31", "remaining_time": "1:41:42", "throughput": 3347.56, "total_tokens": 197945616} +{"current_steps": 162785, "total_steps": 179580, "loss": 0.6769, "lr": 1.3205642523895418e-06, "epoch": 18.12952444592939, "percentage": 90.65, "elapsed_time": "16:25:33", "remaining_time": "1:41:40", "throughput": 3347.57, "total_tokens": 197951920} +{"current_steps": 162790, "total_steps": 179580, "loss": 0.6447, "lr": 1.319785122972425e-06, "epoch": 18.130081300813007, "percentage": 90.65, "elapsed_time": "16:25:34", "remaining_time": "1:41:39", "throughput": 3347.57, "total_tokens": 197958416} +{"current_steps": 162795, "total_steps": 179580, "loss": 0.7095, "lr": 1.3190062172339062e-06, "epoch": 18.130638155696627, "percentage": 90.65, "elapsed_time": "16:25:36", "remaining_time": "1:41:37", "throughput": 3347.58, "total_tokens": 197964560} +{"current_steps": 162800, "total_steps": 179580, "loss": 0.9898, "lr": 1.3182275351813516e-06, "epoch": 18.131195010580242, "percentage": 90.66, "elapsed_time": "16:25:38", "remaining_time": "1:41:35", "throughput": 3347.58, "total_tokens": 197970736} +{"current_steps": 162805, "total_steps": 179580, "loss": 0.6829, "lr": 1.317449076822111e-06, "epoch": 18.131751865463862, "percentage": 90.66, "elapsed_time": "16:25:40", "remaining_time": "1:41:33", "throughput": 3347.59, "total_tokens": 197977136} +{"current_steps": 162810, "total_steps": 179580, "loss": 0.758, "lr": 1.3166708421635366e-06, "epoch": 18.132308720347478, "percentage": 90.66, "elapsed_time": "16:25:41", "remaining_time": "1:41:31", "throughput": 3347.59, "total_tokens": 197983088} +{"current_steps": 162815, "total_steps": 179580, "loss": 0.7741, "lr": 1.315892831212978e-06, "epoch": 18.132865575231094, "percentage": 90.66, "elapsed_time": "16:25:43", "remaining_time": "1:41:30", "throughput": 3347.59, "total_tokens": 197989168} +{"current_steps": 162820, "total_steps": 179580, "loss": 0.6662, "lr": 1.3151150439777909e-06, "epoch": 18.133422430114713, "percentage": 90.67, "elapsed_time": "16:25:45", "remaining_time": "1:41:28", "throughput": 3347.6, "total_tokens": 197995504} +{"current_steps": 162825, "total_steps": 179580, "loss": 0.6932, "lr": 1.314337480465319e-06, "epoch": 18.13397928499833, "percentage": 90.67, "elapsed_time": "16:25:47", "remaining_time": "1:41:26", "throughput": 3347.6, "total_tokens": 198001616} +{"current_steps": 162830, "total_steps": 179580, "loss": 0.5923, "lr": 1.313560140682904e-06, "epoch": 18.13453613988195, "percentage": 90.67, "elapsed_time": "16:25:49", "remaining_time": "1:41:24", "throughput": 3347.6, "total_tokens": 198007600} +{"current_steps": 162835, "total_steps": 179580, "loss": 0.7737, "lr": 1.3127830246378897e-06, "epoch": 18.135092994765564, "percentage": 90.68, "elapsed_time": "16:25:50", "remaining_time": "1:41:22", "throughput": 3347.61, "total_tokens": 198013744} +{"current_steps": 162840, "total_steps": 179580, "loss": 0.5473, "lr": 1.3120061323376205e-06, "epoch": 18.13564984964918, "percentage": 90.68, "elapsed_time": "16:25:52", "remaining_time": "1:41:20", "throughput": 3347.61, "total_tokens": 198019696} +{"current_steps": 162845, "total_steps": 179580, "loss": 0.7492, "lr": 1.3112294637894263e-06, "epoch": 18.1362067045328, "percentage": 90.68, "elapsed_time": "16:25:54", "remaining_time": "1:41:19", "throughput": 3347.61, "total_tokens": 198025296} +{"current_steps": 162850, "total_steps": 179580, "loss": 0.5686, "lr": 1.310453019000657e-06, "epoch": 18.136763559416416, "percentage": 90.68, "elapsed_time": "16:25:55", "remaining_time": "1:41:17", "throughput": 3347.62, "total_tokens": 198031152} +{"current_steps": 162855, "total_steps": 179580, "loss": 0.5484, "lr": 1.3096767979786345e-06, "epoch": 18.137320414300035, "percentage": 90.69, "elapsed_time": "16:25:57", "remaining_time": "1:41:15", "throughput": 3347.62, "total_tokens": 198037520} +{"current_steps": 162860, "total_steps": 179580, "loss": 0.7613, "lr": 1.3089008007306947e-06, "epoch": 18.13787726918365, "percentage": 90.69, "elapsed_time": "16:25:59", "remaining_time": "1:41:13", "throughput": 3347.62, "total_tokens": 198043920} +{"current_steps": 162865, "total_steps": 179580, "loss": 0.6848, "lr": 1.3081250272641649e-06, "epoch": 18.138434124067267, "percentage": 90.69, "elapsed_time": "16:26:01", "remaining_time": "1:41:11", "throughput": 3347.63, "total_tokens": 198049648} +{"current_steps": 162870, "total_steps": 179580, "loss": 0.9403, "lr": 1.307349477586381e-06, "epoch": 18.138990978950886, "percentage": 90.69, "elapsed_time": "16:26:02", "remaining_time": "1:41:09", "throughput": 3347.63, "total_tokens": 198055824} +{"current_steps": 162875, "total_steps": 179580, "loss": 0.5435, "lr": 1.306574151704662e-06, "epoch": 18.139547833834502, "percentage": 90.7, "elapsed_time": "16:26:04", "remaining_time": "1:41:08", "throughput": 3347.64, "total_tokens": 198061808} +{"current_steps": 162880, "total_steps": 179580, "loss": 0.5735, "lr": 1.3057990496263357e-06, "epoch": 18.14010468871812, "percentage": 90.7, "elapsed_time": "16:26:06", "remaining_time": "1:41:06", "throughput": 3347.64, "total_tokens": 198067984} +{"current_steps": 162885, "total_steps": 179580, "loss": 0.8664, "lr": 1.3050241713587152e-06, "epoch": 18.140661543601738, "percentage": 90.7, "elapsed_time": "16:26:08", "remaining_time": "1:41:04", "throughput": 3347.64, "total_tokens": 198073936} +{"current_steps": 162890, "total_steps": 179580, "loss": 0.6653, "lr": 1.3042495169091285e-06, "epoch": 18.141218398485353, "percentage": 90.71, "elapsed_time": "16:26:09", "remaining_time": "1:41:02", "throughput": 3347.65, "total_tokens": 198080144} +{"current_steps": 162895, "total_steps": 179580, "loss": 0.7458, "lr": 1.3034750862848916e-06, "epoch": 18.141775253368973, "percentage": 90.71, "elapsed_time": "16:26:11", "remaining_time": "1:41:00", "throughput": 3347.65, "total_tokens": 198086160} +{"current_steps": 162900, "total_steps": 179580, "loss": 0.7954, "lr": 1.3027008794933155e-06, "epoch": 18.14233210825259, "percentage": 90.71, "elapsed_time": "16:26:13", "remaining_time": "1:40:59", "throughput": 3347.65, "total_tokens": 198091888} +{"current_steps": 162905, "total_steps": 179580, "loss": 0.5425, "lr": 1.3019268965417165e-06, "epoch": 18.14288896313621, "percentage": 90.71, "elapsed_time": "16:26:15", "remaining_time": "1:40:57", "throughput": 3347.66, "total_tokens": 198098288} +{"current_steps": 162910, "total_steps": 179580, "loss": 0.7635, "lr": 1.3011531374374026e-06, "epoch": 18.143445818019824, "percentage": 90.72, "elapsed_time": "16:26:16", "remaining_time": "1:40:55", "throughput": 3347.66, "total_tokens": 198104144} +{"current_steps": 162915, "total_steps": 179580, "loss": 0.7028, "lr": 1.3003796021876875e-06, "epoch": 18.14400267290344, "percentage": 90.72, "elapsed_time": "16:26:18", "remaining_time": "1:40:53", "throughput": 3347.66, "total_tokens": 198110160} +{"current_steps": 162920, "total_steps": 179580, "loss": 0.5096, "lr": 1.2996062907998735e-06, "epoch": 18.14455952778706, "percentage": 90.72, "elapsed_time": "16:26:20", "remaining_time": "1:40:51", "throughput": 3347.67, "total_tokens": 198116304} +{"current_steps": 162925, "total_steps": 179580, "loss": 1.0418, "lr": 1.2988332032812662e-06, "epoch": 18.145116382670675, "percentage": 90.73, "elapsed_time": "16:26:22", "remaining_time": "1:40:49", "throughput": 3347.67, "total_tokens": 198122512} +{"current_steps": 162930, "total_steps": 179580, "loss": 0.78, "lr": 1.2980603396391678e-06, "epoch": 18.145673237554295, "percentage": 90.73, "elapsed_time": "16:26:24", "remaining_time": "1:40:48", "throughput": 3347.67, "total_tokens": 198128656} +{"current_steps": 162935, "total_steps": 179580, "loss": 0.5885, "lr": 1.297287699880878e-06, "epoch": 18.14623009243791, "percentage": 90.73, "elapsed_time": "16:26:25", "remaining_time": "1:40:46", "throughput": 3347.67, "total_tokens": 198134672} +{"current_steps": 162940, "total_steps": 179580, "loss": 0.7244, "lr": 1.296515284013697e-06, "epoch": 18.146786947321527, "percentage": 90.73, "elapsed_time": "16:26:27", "remaining_time": "1:40:44", "throughput": 3347.68, "total_tokens": 198140752} +{"current_steps": 162945, "total_steps": 179580, "loss": 0.8226, "lr": 1.2957430920449266e-06, "epoch": 18.147343802205146, "percentage": 90.74, "elapsed_time": "16:26:29", "remaining_time": "1:40:42", "throughput": 3347.68, "total_tokens": 198146960} +{"current_steps": 162950, "total_steps": 179580, "loss": 0.7583, "lr": 1.2949711239818447e-06, "epoch": 18.147900657088762, "percentage": 90.74, "elapsed_time": "16:26:30", "remaining_time": "1:40:40", "throughput": 3347.69, "total_tokens": 198152944} +{"current_steps": 162955, "total_steps": 179580, "loss": 0.5245, "lr": 1.2941993798317565e-06, "epoch": 18.14845751197238, "percentage": 90.74, "elapsed_time": "16:26:32", "remaining_time": "1:40:38", "throughput": 3347.69, "total_tokens": 198159280} +{"current_steps": 162960, "total_steps": 179580, "loss": 0.5146, "lr": 1.2934278596019477e-06, "epoch": 18.149014366855997, "percentage": 90.75, "elapsed_time": "16:26:34", "remaining_time": "1:40:37", "throughput": 3347.69, "total_tokens": 198165200} +{"current_steps": 162965, "total_steps": 179580, "loss": 1.1427, "lr": 1.2926565632997074e-06, "epoch": 18.149571221739613, "percentage": 90.75, "elapsed_time": "16:26:36", "remaining_time": "1:40:35", "throughput": 3347.7, "total_tokens": 198171440} +{"current_steps": 162970, "total_steps": 179580, "loss": 0.7333, "lr": 1.2918854909323181e-06, "epoch": 18.150128076623233, "percentage": 90.75, "elapsed_time": "16:26:38", "remaining_time": "1:40:33", "throughput": 3347.7, "total_tokens": 198177392} +{"current_steps": 162975, "total_steps": 179580, "loss": 0.7679, "lr": 1.2911146425070686e-06, "epoch": 18.15068493150685, "percentage": 90.75, "elapsed_time": "16:26:39", "remaining_time": "1:40:31", "throughput": 3347.71, "total_tokens": 198183504} +{"current_steps": 162980, "total_steps": 179580, "loss": 0.6555, "lr": 1.290344018031231e-06, "epoch": 18.151241786390468, "percentage": 90.76, "elapsed_time": "16:26:41", "remaining_time": "1:40:29", "throughput": 3347.71, "total_tokens": 198189616} +{"current_steps": 162985, "total_steps": 179580, "loss": 0.7771, "lr": 1.2895736175120937e-06, "epoch": 18.151798641274084, "percentage": 90.76, "elapsed_time": "16:26:43", "remaining_time": "1:40:28", "throughput": 3347.71, "total_tokens": 198195888} +{"current_steps": 162990, "total_steps": 179580, "loss": 0.5941, "lr": 1.288803440956929e-06, "epoch": 18.1523554961577, "percentage": 90.76, "elapsed_time": "16:26:45", "remaining_time": "1:40:26", "throughput": 3347.72, "total_tokens": 198201808} +{"current_steps": 162995, "total_steps": 179580, "loss": 0.7087, "lr": 1.2880334883730137e-06, "epoch": 18.15291235104132, "percentage": 90.76, "elapsed_time": "16:26:46", "remaining_time": "1:40:24", "throughput": 3347.72, "total_tokens": 198208272} +{"current_steps": 163000, "total_steps": 179580, "loss": 0.5765, "lr": 1.287263759767618e-06, "epoch": 18.153469205924935, "percentage": 90.77, "elapsed_time": "16:26:48", "remaining_time": "1:40:22", "throughput": 3347.72, "total_tokens": 198214256} +{"current_steps": 163005, "total_steps": 179580, "loss": 0.6305, "lr": 1.2864942551480157e-06, "epoch": 18.154026060808555, "percentage": 90.77, "elapsed_time": "16:26:50", "remaining_time": "1:40:20", "throughput": 3347.73, "total_tokens": 198220560} +{"current_steps": 163010, "total_steps": 179580, "loss": 0.8688, "lr": 1.2857249745214712e-06, "epoch": 18.15458291569217, "percentage": 90.77, "elapsed_time": "16:26:52", "remaining_time": "1:40:18", "throughput": 3347.73, "total_tokens": 198226864} +{"current_steps": 163015, "total_steps": 179580, "loss": 0.664, "lr": 1.2849559178952586e-06, "epoch": 18.155139770575786, "percentage": 90.78, "elapsed_time": "16:26:54", "remaining_time": "1:40:17", "throughput": 3347.74, "total_tokens": 198232912} +{"current_steps": 163020, "total_steps": 179580, "loss": 0.5921, "lr": 1.2841870852766363e-06, "epoch": 18.155696625459406, "percentage": 90.78, "elapsed_time": "16:26:55", "remaining_time": "1:40:15", "throughput": 3347.74, "total_tokens": 198238864} +{"current_steps": 163025, "total_steps": 179580, "loss": 0.649, "lr": 1.283418476672868e-06, "epoch": 18.156253480343022, "percentage": 90.78, "elapsed_time": "16:26:57", "remaining_time": "1:40:13", "throughput": 3347.74, "total_tokens": 198245008} +{"current_steps": 163030, "total_steps": 179580, "loss": 0.8111, "lr": 1.2826500920912087e-06, "epoch": 18.15681033522664, "percentage": 90.78, "elapsed_time": "16:26:59", "remaining_time": "1:40:11", "throughput": 3347.75, "total_tokens": 198250480} +{"current_steps": 163035, "total_steps": 179580, "loss": 0.7411, "lr": 1.281881931538928e-06, "epoch": 18.157367190110257, "percentage": 90.79, "elapsed_time": "16:27:00", "remaining_time": "1:40:09", "throughput": 3347.75, "total_tokens": 198256336} +{"current_steps": 163040, "total_steps": 179580, "loss": 0.6292, "lr": 1.2811139950232726e-06, "epoch": 18.157924044993873, "percentage": 90.79, "elapsed_time": "16:27:02", "remaining_time": "1:40:07", "throughput": 3347.75, "total_tokens": 198262576} +{"current_steps": 163045, "total_steps": 179580, "loss": 0.6816, "lr": 1.2803462825514979e-06, "epoch": 18.158480899877492, "percentage": 90.79, "elapsed_time": "16:27:04", "remaining_time": "1:40:06", "throughput": 3347.76, "total_tokens": 198268752} +{"current_steps": 163050, "total_steps": 179580, "loss": 0.8475, "lr": 1.2795787941308562e-06, "epoch": 18.15903775476111, "percentage": 90.8, "elapsed_time": "16:27:06", "remaining_time": "1:40:04", "throughput": 3347.76, "total_tokens": 198274864} +{"current_steps": 163055, "total_steps": 179580, "loss": 0.5988, "lr": 1.2788115297685976e-06, "epoch": 18.159594609644728, "percentage": 90.8, "elapsed_time": "16:27:07", "remaining_time": "1:40:02", "throughput": 3347.76, "total_tokens": 198280912} +{"current_steps": 163060, "total_steps": 179580, "loss": 0.6786, "lr": 1.2780444894719689e-06, "epoch": 18.160151464528344, "percentage": 90.8, "elapsed_time": "16:27:09", "remaining_time": "1:40:00", "throughput": 3347.77, "total_tokens": 198286992} +{"current_steps": 163065, "total_steps": 179580, "loss": 0.6273, "lr": 1.27727767324822e-06, "epoch": 18.16070831941196, "percentage": 90.8, "elapsed_time": "16:27:11", "remaining_time": "1:39:58", "throughput": 3347.77, "total_tokens": 198293392} +{"current_steps": 163070, "total_steps": 179580, "loss": 0.5544, "lr": 1.2765110811045838e-06, "epoch": 18.16126517429558, "percentage": 90.81, "elapsed_time": "16:27:13", "remaining_time": "1:39:57", "throughput": 3347.77, "total_tokens": 198299664} +{"current_steps": 163075, "total_steps": 179580, "loss": 0.9042, "lr": 1.2757447130483103e-06, "epoch": 18.161822029179195, "percentage": 90.81, "elapsed_time": "16:27:15", "remaining_time": "1:39:55", "throughput": 3347.78, "total_tokens": 198305744} +{"current_steps": 163080, "total_steps": 179580, "loss": 0.7591, "lr": 1.2749785690866324e-06, "epoch": 18.162378884062814, "percentage": 90.81, "elapsed_time": "16:27:16", "remaining_time": "1:39:53", "throughput": 3347.78, "total_tokens": 198311888} +{"current_steps": 163085, "total_steps": 179580, "loss": 0.7653, "lr": 1.2742126492267942e-06, "epoch": 18.16293573894643, "percentage": 90.81, "elapsed_time": "16:27:18", "remaining_time": "1:39:51", "throughput": 3347.79, "total_tokens": 198317744} +{"current_steps": 163090, "total_steps": 179580, "loss": 0.6307, "lr": 1.2734469534760263e-06, "epoch": 18.163492593830046, "percentage": 90.82, "elapsed_time": "16:27:20", "remaining_time": "1:39:49", "throughput": 3347.79, "total_tokens": 198323920} +{"current_steps": 163095, "total_steps": 179580, "loss": 0.8007, "lr": 1.2726814818415617e-06, "epoch": 18.164049448713666, "percentage": 90.82, "elapsed_time": "16:27:22", "remaining_time": "1:39:47", "throughput": 3347.79, "total_tokens": 198330096} +{"current_steps": 163100, "total_steps": 179580, "loss": 0.6372, "lr": 1.2719162343306252e-06, "epoch": 18.16460630359728, "percentage": 90.82, "elapsed_time": "16:27:23", "remaining_time": "1:39:46", "throughput": 3347.8, "total_tokens": 198336208} +{"current_steps": 163105, "total_steps": 179580, "loss": 0.8391, "lr": 1.2711512109504553e-06, "epoch": 18.1651631584809, "percentage": 90.83, "elapsed_time": "16:27:25", "remaining_time": "1:39:44", "throughput": 3347.8, "total_tokens": 198342736} +{"current_steps": 163110, "total_steps": 179580, "loss": 0.9982, "lr": 1.2703864117082742e-06, "epoch": 18.165720013364517, "percentage": 90.83, "elapsed_time": "16:27:27", "remaining_time": "1:39:42", "throughput": 3347.8, "total_tokens": 198348688} +{"current_steps": 163115, "total_steps": 179580, "loss": 0.5796, "lr": 1.2696218366113038e-06, "epoch": 18.166276868248133, "percentage": 90.83, "elapsed_time": "16:27:29", "remaining_time": "1:39:40", "throughput": 3347.81, "total_tokens": 198354800} +{"current_steps": 163120, "total_steps": 179580, "loss": 0.7948, "lr": 1.2688574856667635e-06, "epoch": 18.166833723131752, "percentage": 90.83, "elapsed_time": "16:27:30", "remaining_time": "1:39:38", "throughput": 3347.81, "total_tokens": 198360688} +{"current_steps": 163125, "total_steps": 179580, "loss": 0.6176, "lr": 1.2680933588818833e-06, "epoch": 18.167390578015368, "percentage": 90.84, "elapsed_time": "16:27:32", "remaining_time": "1:39:37", "throughput": 3347.82, "total_tokens": 198366832} +{"current_steps": 163130, "total_steps": 179580, "loss": 0.8551, "lr": 1.2673294562638688e-06, "epoch": 18.167947432898988, "percentage": 90.84, "elapsed_time": "16:27:34", "remaining_time": "1:39:35", "throughput": 3347.82, "total_tokens": 198372560} +{"current_steps": 163135, "total_steps": 179580, "loss": 0.9339, "lr": 1.2665657778199503e-06, "epoch": 18.168504287782604, "percentage": 90.84, "elapsed_time": "16:27:35", "remaining_time": "1:39:33", "throughput": 3347.82, "total_tokens": 198378544} +{"current_steps": 163140, "total_steps": 179580, "loss": 0.6973, "lr": 1.2658023235573274e-06, "epoch": 18.169061142666223, "percentage": 90.85, "elapsed_time": "16:27:37", "remaining_time": "1:39:31", "throughput": 3347.82, "total_tokens": 198384496} +{"current_steps": 163145, "total_steps": 179580, "loss": 0.8827, "lr": 1.2650390934832168e-06, "epoch": 18.16961799754984, "percentage": 90.85, "elapsed_time": "16:27:39", "remaining_time": "1:39:29", "throughput": 3347.83, "total_tokens": 198390800} +{"current_steps": 163150, "total_steps": 179580, "loss": 0.8566, "lr": 1.2642760876048293e-06, "epoch": 18.170174852433455, "percentage": 90.85, "elapsed_time": "16:27:41", "remaining_time": "1:39:27", "throughput": 3347.83, "total_tokens": 198396976} +{"current_steps": 163155, "total_steps": 179580, "loss": 0.6566, "lr": 1.2635133059293702e-06, "epoch": 18.170731707317074, "percentage": 90.85, "elapsed_time": "16:27:43", "remaining_time": "1:39:26", "throughput": 3347.84, "total_tokens": 198403344} +{"current_steps": 163160, "total_steps": 179580, "loss": 0.5538, "lr": 1.2627507484640477e-06, "epoch": 18.17128856220069, "percentage": 90.86, "elapsed_time": "16:27:45", "remaining_time": "1:39:24", "throughput": 3347.84, "total_tokens": 198409872} +{"current_steps": 163165, "total_steps": 179580, "loss": 0.7543, "lr": 1.2619884152160615e-06, "epoch": 18.17184541708431, "percentage": 90.86, "elapsed_time": "16:27:46", "remaining_time": "1:39:22", "throughput": 3347.84, "total_tokens": 198415792} +{"current_steps": 163170, "total_steps": 179580, "loss": 0.5379, "lr": 1.2612263061926087e-06, "epoch": 18.172402271967925, "percentage": 90.86, "elapsed_time": "16:27:48", "remaining_time": "1:39:20", "throughput": 3347.85, "total_tokens": 198422352} +{"current_steps": 163175, "total_steps": 179580, "loss": 0.6145, "lr": 1.2604644214008976e-06, "epoch": 18.17295912685154, "percentage": 90.86, "elapsed_time": "16:27:50", "remaining_time": "1:39:18", "throughput": 3347.85, "total_tokens": 198427984} +{"current_steps": 163180, "total_steps": 179580, "loss": 0.7719, "lr": 1.2597027608481193e-06, "epoch": 18.17351598173516, "percentage": 90.87, "elapsed_time": "16:27:51", "remaining_time": "1:39:16", "throughput": 3347.86, "total_tokens": 198433968} +{"current_steps": 163185, "total_steps": 179580, "loss": 0.6516, "lr": 1.258941324541471e-06, "epoch": 18.174072836618777, "percentage": 90.87, "elapsed_time": "16:27:53", "remaining_time": "1:39:15", "throughput": 3347.86, "total_tokens": 198439888} +{"current_steps": 163190, "total_steps": 179580, "loss": 0.8633, "lr": 1.258180112488136e-06, "epoch": 18.174629691502396, "percentage": 90.87, "elapsed_time": "16:27:55", "remaining_time": "1:39:13", "throughput": 3347.86, "total_tokens": 198445936} +{"current_steps": 163195, "total_steps": 179580, "loss": 0.6522, "lr": 1.2574191246953166e-06, "epoch": 18.175186546386012, "percentage": 90.88, "elapsed_time": "16:27:57", "remaining_time": "1:39:11", "throughput": 3347.86, "total_tokens": 198452496} +{"current_steps": 163200, "total_steps": 179580, "loss": 1.1007, "lr": 1.2566583611701933e-06, "epoch": 18.175743401269628, "percentage": 90.88, "elapsed_time": "16:27:59", "remaining_time": "1:39:09", "throughput": 3347.86, "total_tokens": 198458768} +{"current_steps": 163205, "total_steps": 179580, "loss": 0.8995, "lr": 1.2558978219199573e-06, "epoch": 18.176300256153247, "percentage": 90.88, "elapsed_time": "16:28:01", "remaining_time": "1:39:07", "throughput": 3347.86, "total_tokens": 198464976} +{"current_steps": 163210, "total_steps": 179580, "loss": 0.6726, "lr": 1.2551375069517895e-06, "epoch": 18.176857111036863, "percentage": 90.88, "elapsed_time": "16:28:02", "remaining_time": "1:39:06", "throughput": 3347.87, "total_tokens": 198470576} +{"current_steps": 163215, "total_steps": 179580, "loss": 0.7466, "lr": 1.2543774162728728e-06, "epoch": 18.177413965920483, "percentage": 90.89, "elapsed_time": "16:28:04", "remaining_time": "1:39:04", "throughput": 3347.87, "total_tokens": 198476688} +{"current_steps": 163220, "total_steps": 179580, "loss": 0.7118, "lr": 1.2536175498903817e-06, "epoch": 18.1779708208041, "percentage": 90.89, "elapsed_time": "16:28:06", "remaining_time": "1:39:02", "throughput": 3347.88, "total_tokens": 198482992} +{"current_steps": 163225, "total_steps": 179580, "loss": 0.4939, "lr": 1.2528579078115e-06, "epoch": 18.178527675687715, "percentage": 90.89, "elapsed_time": "16:28:07", "remaining_time": "1:39:00", "throughput": 3347.88, "total_tokens": 198488816} +{"current_steps": 163230, "total_steps": 179580, "loss": 0.8567, "lr": 1.2520984900434046e-06, "epoch": 18.179084530571334, "percentage": 90.9, "elapsed_time": "16:28:09", "remaining_time": "1:38:58", "throughput": 3347.88, "total_tokens": 198494384} +{"current_steps": 163235, "total_steps": 179580, "loss": 0.7731, "lr": 1.2513392965932625e-06, "epoch": 18.17964138545495, "percentage": 90.9, "elapsed_time": "16:28:11", "remaining_time": "1:38:56", "throughput": 3347.89, "total_tokens": 198500624} +{"current_steps": 163240, "total_steps": 179580, "loss": 0.5256, "lr": 1.2505803274682454e-06, "epoch": 18.18019824033857, "percentage": 90.9, "elapsed_time": "16:28:13", "remaining_time": "1:38:55", "throughput": 3347.89, "total_tokens": 198506544} +{"current_steps": 163245, "total_steps": 179580, "loss": 0.7801, "lr": 1.2498215826755283e-06, "epoch": 18.180755095222185, "percentage": 90.9, "elapsed_time": "16:28:14", "remaining_time": "1:38:53", "throughput": 3347.89, "total_tokens": 198512784} +{"current_steps": 163250, "total_steps": 179580, "loss": 0.8045, "lr": 1.2490630622222721e-06, "epoch": 18.1813119501058, "percentage": 90.91, "elapsed_time": "16:28:16", "remaining_time": "1:38:51", "throughput": 3347.89, "total_tokens": 198518608} +{"current_steps": 163255, "total_steps": 179580, "loss": 0.7059, "lr": 1.2483047661156517e-06, "epoch": 18.18186880498942, "percentage": 90.91, "elapsed_time": "16:28:18", "remaining_time": "1:38:49", "throughput": 3347.9, "total_tokens": 198524592} +{"current_steps": 163260, "total_steps": 179580, "loss": 0.639, "lr": 1.247546694362814e-06, "epoch": 18.182425659873036, "percentage": 90.91, "elapsed_time": "16:28:19", "remaining_time": "1:38:47", "throughput": 3347.9, "total_tokens": 198530128} +{"current_steps": 163265, "total_steps": 179580, "loss": 0.9037, "lr": 1.246788846970931e-06, "epoch": 18.182982514756656, "percentage": 90.91, "elapsed_time": "16:28:21", "remaining_time": "1:38:45", "throughput": 3347.9, "total_tokens": 198536176} +{"current_steps": 163270, "total_steps": 179580, "loss": 0.794, "lr": 1.2460312239471555e-06, "epoch": 18.183539369640272, "percentage": 90.92, "elapsed_time": "16:28:23", "remaining_time": "1:38:44", "throughput": 3347.91, "total_tokens": 198542352} +{"current_steps": 163275, "total_steps": 179580, "loss": 0.9703, "lr": 1.2452738252986513e-06, "epoch": 18.184096224523888, "percentage": 90.92, "elapsed_time": "16:28:25", "remaining_time": "1:38:42", "throughput": 3347.91, "total_tokens": 198548240} +{"current_steps": 163280, "total_steps": 179580, "loss": 0.7526, "lr": 1.244516651032565e-06, "epoch": 18.184653079407507, "percentage": 90.92, "elapsed_time": "16:28:26", "remaining_time": "1:38:40", "throughput": 3347.91, "total_tokens": 198554192} +{"current_steps": 163285, "total_steps": 179580, "loss": 0.9592, "lr": 1.2437597011560526e-06, "epoch": 18.185209934291123, "percentage": 90.93, "elapsed_time": "16:28:28", "remaining_time": "1:38:38", "throughput": 3347.91, "total_tokens": 198560304} +{"current_steps": 163290, "total_steps": 179580, "loss": 0.5757, "lr": 1.2430029756762606e-06, "epoch": 18.185766789174743, "percentage": 90.93, "elapsed_time": "16:28:30", "remaining_time": "1:38:36", "throughput": 3347.92, "total_tokens": 198566416} +{"current_steps": 163295, "total_steps": 179580, "loss": 0.8321, "lr": 1.242246474600342e-06, "epoch": 18.18632364405836, "percentage": 90.93, "elapsed_time": "16:28:32", "remaining_time": "1:38:35", "throughput": 3347.92, "total_tokens": 198572464} +{"current_steps": 163300, "total_steps": 179580, "loss": 0.918, "lr": 1.2414901979354382e-06, "epoch": 18.186880498941974, "percentage": 90.93, "elapsed_time": "16:28:33", "remaining_time": "1:38:33", "throughput": 3347.92, "total_tokens": 198578768} +{"current_steps": 163305, "total_steps": 179580, "loss": 0.7436, "lr": 1.2407341456886961e-06, "epoch": 18.187437353825594, "percentage": 90.94, "elapsed_time": "16:28:35", "remaining_time": "1:38:31", "throughput": 3347.93, "total_tokens": 198584784} +{"current_steps": 163310, "total_steps": 179580, "loss": 0.8952, "lr": 1.2399783178672548e-06, "epoch": 18.18799420870921, "percentage": 90.94, "elapsed_time": "16:28:37", "remaining_time": "1:38:29", "throughput": 3347.93, "total_tokens": 198590800} +{"current_steps": 163315, "total_steps": 179580, "loss": 0.6663, "lr": 1.2392227144782525e-06, "epoch": 18.18855106359283, "percentage": 90.94, "elapsed_time": "16:28:39", "remaining_time": "1:38:27", "throughput": 3347.93, "total_tokens": 198596656} +{"current_steps": 163320, "total_steps": 179580, "loss": 0.9544, "lr": 1.2384673355288311e-06, "epoch": 18.189107918476445, "percentage": 90.95, "elapsed_time": "16:28:40", "remaining_time": "1:38:25", "throughput": 3347.94, "total_tokens": 198602960} +{"current_steps": 163325, "total_steps": 179580, "loss": 0.7002, "lr": 1.2377121810261238e-06, "epoch": 18.18966477336006, "percentage": 90.95, "elapsed_time": "16:28:42", "remaining_time": "1:38:24", "throughput": 3347.94, "total_tokens": 198609488} +{"current_steps": 163330, "total_steps": 179580, "loss": 1.0167, "lr": 1.236957250977261e-06, "epoch": 18.19022162824368, "percentage": 90.95, "elapsed_time": "16:28:44", "remaining_time": "1:38:22", "throughput": 3347.95, "total_tokens": 198615536} +{"current_steps": 163335, "total_steps": 179580, "loss": 0.7142, "lr": 1.2362025453893755e-06, "epoch": 18.190778483127296, "percentage": 90.95, "elapsed_time": "16:28:46", "remaining_time": "1:38:20", "throughput": 3347.95, "total_tokens": 198621776} +{"current_steps": 163340, "total_steps": 179580, "loss": 0.7529, "lr": 1.2354480642695982e-06, "epoch": 18.191335338010916, "percentage": 90.96, "elapsed_time": "16:28:48", "remaining_time": "1:38:18", "throughput": 3347.95, "total_tokens": 198628080} +{"current_steps": 163345, "total_steps": 179580, "loss": 0.6762, "lr": 1.234693807625048e-06, "epoch": 18.19189219289453, "percentage": 90.96, "elapsed_time": "16:28:49", "remaining_time": "1:38:16", "throughput": 3347.96, "total_tokens": 198634224} +{"current_steps": 163350, "total_steps": 179580, "loss": 0.7565, "lr": 1.2339397754628613e-06, "epoch": 18.192449047778148, "percentage": 90.96, "elapsed_time": "16:28:51", "remaining_time": "1:38:15", "throughput": 3347.96, "total_tokens": 198640176} +{"current_steps": 163355, "total_steps": 179580, "loss": 0.5279, "lr": 1.2331859677901542e-06, "epoch": 18.193005902661767, "percentage": 90.97, "elapsed_time": "16:28:53", "remaining_time": "1:38:13", "throughput": 3347.96, "total_tokens": 198646096} +{"current_steps": 163360, "total_steps": 179580, "loss": 0.7856, "lr": 1.2324323846140462e-06, "epoch": 18.193562757545383, "percentage": 90.97, "elapsed_time": "16:28:55", "remaining_time": "1:38:11", "throughput": 3347.96, "total_tokens": 198652304} +{"current_steps": 163365, "total_steps": 179580, "loss": 0.7898, "lr": 1.2316790259416538e-06, "epoch": 18.194119612429002, "percentage": 90.97, "elapsed_time": "16:28:57", "remaining_time": "1:38:09", "throughput": 3347.97, "total_tokens": 198658640} +{"current_steps": 163370, "total_steps": 179580, "loss": 0.8158, "lr": 1.2309258917800993e-06, "epoch": 18.19467646731262, "percentage": 90.97, "elapsed_time": "16:28:58", "remaining_time": "1:38:07", "throughput": 3347.97, "total_tokens": 198665104} +{"current_steps": 163375, "total_steps": 179580, "loss": 0.6882, "lr": 1.2301729821364931e-06, "epoch": 18.195233322196234, "percentage": 90.98, "elapsed_time": "16:29:00", "remaining_time": "1:38:05", "throughput": 3347.98, "total_tokens": 198671184} +{"current_steps": 163380, "total_steps": 179580, "loss": 0.7008, "lr": 1.229420297017947e-06, "epoch": 18.195790177079854, "percentage": 90.98, "elapsed_time": "16:29:02", "remaining_time": "1:38:04", "throughput": 3347.98, "total_tokens": 198677168} +{"current_steps": 163385, "total_steps": 179580, "loss": 0.8296, "lr": 1.2286678364315656e-06, "epoch": 18.19634703196347, "percentage": 90.98, "elapsed_time": "16:29:04", "remaining_time": "1:38:02", "throughput": 3347.98, "total_tokens": 198683376} +{"current_steps": 163390, "total_steps": 179580, "loss": 0.5323, "lr": 1.2279156003844689e-06, "epoch": 18.19690388684709, "percentage": 90.98, "elapsed_time": "16:29:06", "remaining_time": "1:38:00", "throughput": 3347.99, "total_tokens": 198689680} +{"current_steps": 163395, "total_steps": 179580, "loss": 0.6948, "lr": 1.2271635888837534e-06, "epoch": 18.197460741730705, "percentage": 90.99, "elapsed_time": "16:29:07", "remaining_time": "1:37:58", "throughput": 3347.99, "total_tokens": 198695888} +{"current_steps": 163400, "total_steps": 179580, "loss": 0.863, "lr": 1.226411801936525e-06, "epoch": 18.19801759661432, "percentage": 90.99, "elapsed_time": "16:29:09", "remaining_time": "1:37:56", "throughput": 3347.99, "total_tokens": 198701968} +{"current_steps": 163405, "total_steps": 179580, "loss": 0.8268, "lr": 1.225660239549878e-06, "epoch": 18.19857445149794, "percentage": 90.99, "elapsed_time": "16:29:11", "remaining_time": "1:37:55", "throughput": 3348.0, "total_tokens": 198708272} +{"current_steps": 163410, "total_steps": 179580, "loss": 0.6373, "lr": 1.2249089017309256e-06, "epoch": 18.199131306381556, "percentage": 91.0, "elapsed_time": "16:29:13", "remaining_time": "1:37:53", "throughput": 3348.0, "total_tokens": 198714352} +{"current_steps": 163415, "total_steps": 179580, "loss": 0.6461, "lr": 1.2241577884867488e-06, "epoch": 18.199688161265176, "percentage": 91.0, "elapsed_time": "16:29:14", "remaining_time": "1:37:51", "throughput": 3348.0, "total_tokens": 198720528} +{"current_steps": 163420, "total_steps": 179580, "loss": 0.5606, "lr": 1.2234068998244586e-06, "epoch": 18.20024501614879, "percentage": 91.0, "elapsed_time": "16:29:16", "remaining_time": "1:37:49", "throughput": 3348.01, "total_tokens": 198726736} +{"current_steps": 163425, "total_steps": 179580, "loss": 0.6145, "lr": 1.2226562357511352e-06, "epoch": 18.200801871032407, "percentage": 91.0, "elapsed_time": "16:29:18", "remaining_time": "1:37:47", "throughput": 3348.01, "total_tokens": 198731984} +{"current_steps": 163430, "total_steps": 179580, "loss": 0.5193, "lr": 1.2219057962738783e-06, "epoch": 18.201358725916027, "percentage": 91.01, "elapsed_time": "16:29:19", "remaining_time": "1:37:45", "throughput": 3348.01, "total_tokens": 198738096} +{"current_steps": 163435, "total_steps": 179580, "loss": 0.7846, "lr": 1.221155581399766e-06, "epoch": 18.201915580799643, "percentage": 91.01, "elapsed_time": "16:29:21", "remaining_time": "1:37:44", "throughput": 3348.02, "total_tokens": 198744208} +{"current_steps": 163440, "total_steps": 179580, "loss": 0.6705, "lr": 1.2204055911358925e-06, "epoch": 18.202472435683262, "percentage": 91.01, "elapsed_time": "16:29:23", "remaining_time": "1:37:42", "throughput": 3348.02, "total_tokens": 198750416} +{"current_steps": 163445, "total_steps": 179580, "loss": 0.7488, "lr": 1.2196558254893437e-06, "epoch": 18.203029290566878, "percentage": 91.02, "elapsed_time": "16:29:25", "remaining_time": "1:37:40", "throughput": 3348.02, "total_tokens": 198756624} +{"current_steps": 163450, "total_steps": 179580, "loss": 0.6029, "lr": 1.2189062844671944e-06, "epoch": 18.203586145450494, "percentage": 91.02, "elapsed_time": "16:29:27", "remaining_time": "1:37:38", "throughput": 3348.03, "total_tokens": 198762928} +{"current_steps": 163455, "total_steps": 179580, "loss": 0.5481, "lr": 1.2181569680765282e-06, "epoch": 18.204143000334113, "percentage": 91.02, "elapsed_time": "16:29:28", "remaining_time": "1:37:36", "throughput": 3348.03, "total_tokens": 198769008} +{"current_steps": 163460, "total_steps": 179580, "loss": 1.0222, "lr": 1.217407876324425e-06, "epoch": 18.20469985521773, "percentage": 91.02, "elapsed_time": "16:29:30", "remaining_time": "1:37:34", "throughput": 3348.04, "total_tokens": 198775088} +{"current_steps": 163465, "total_steps": 179580, "loss": 0.5955, "lr": 1.2166590092179547e-06, "epoch": 18.20525671010135, "percentage": 91.03, "elapsed_time": "16:29:32", "remaining_time": "1:37:33", "throughput": 3348.04, "total_tokens": 198780880} +{"current_steps": 163470, "total_steps": 179580, "loss": 0.7799, "lr": 1.215910366764203e-06, "epoch": 18.205813564984965, "percentage": 91.03, "elapsed_time": "16:29:34", "remaining_time": "1:37:31", "throughput": 3348.04, "total_tokens": 198786960} +{"current_steps": 163475, "total_steps": 179580, "loss": 0.5191, "lr": 1.2151619489702255e-06, "epoch": 18.20637041986858, "percentage": 91.03, "elapsed_time": "16:29:35", "remaining_time": "1:37:29", "throughput": 3348.05, "total_tokens": 198792944} +{"current_steps": 163480, "total_steps": 179580, "loss": 0.5255, "lr": 1.2144137558431023e-06, "epoch": 18.2069272747522, "percentage": 91.03, "elapsed_time": "16:29:37", "remaining_time": "1:37:27", "throughput": 3348.05, "total_tokens": 198799056} +{"current_steps": 163485, "total_steps": 179580, "loss": 0.7822, "lr": 1.213665787389895e-06, "epoch": 18.207484129635816, "percentage": 91.04, "elapsed_time": "16:29:39", "remaining_time": "1:37:25", "throughput": 3348.06, "total_tokens": 198804880} +{"current_steps": 163490, "total_steps": 179580, "loss": 0.6912, "lr": 1.212918043617675e-06, "epoch": 18.208040984519435, "percentage": 91.04, "elapsed_time": "16:29:40", "remaining_time": "1:37:24", "throughput": 3348.06, "total_tokens": 198811120} +{"current_steps": 163495, "total_steps": 179580, "loss": 0.5975, "lr": 1.2121705245335042e-06, "epoch": 18.20859783940305, "percentage": 91.04, "elapsed_time": "16:29:42", "remaining_time": "1:37:22", "throughput": 3348.06, "total_tokens": 198816848} +{"current_steps": 163500, "total_steps": 179580, "loss": 0.9242, "lr": 1.21142323014444e-06, "epoch": 18.209154694286667, "percentage": 91.05, "elapsed_time": "16:29:44", "remaining_time": "1:37:20", "throughput": 3348.06, "total_tokens": 198822864} +{"current_steps": 163505, "total_steps": 179580, "loss": 0.8753, "lr": 1.2106761604575384e-06, "epoch": 18.209711549170287, "percentage": 91.05, "elapsed_time": "16:29:46", "remaining_time": "1:37:18", "throughput": 3348.07, "total_tokens": 198829264} +{"current_steps": 163510, "total_steps": 179580, "loss": 0.648, "lr": 1.209929315479863e-06, "epoch": 18.210268404053902, "percentage": 91.05, "elapsed_time": "16:29:47", "remaining_time": "1:37:16", "throughput": 3348.07, "total_tokens": 198834896} +{"current_steps": 163515, "total_steps": 179580, "loss": 0.6837, "lr": 1.2091826952184665e-06, "epoch": 18.210825258937522, "percentage": 91.05, "elapsed_time": "16:29:49", "remaining_time": "1:37:14", "throughput": 3348.07, "total_tokens": 198840880} +{"current_steps": 163520, "total_steps": 179580, "loss": 0.8159, "lr": 1.208436299680399e-06, "epoch": 18.211382113821138, "percentage": 91.06, "elapsed_time": "16:29:51", "remaining_time": "1:37:13", "throughput": 3348.08, "total_tokens": 198846960} +{"current_steps": 163525, "total_steps": 179580, "loss": 1.0367, "lr": 1.20769012887271e-06, "epoch": 18.211938968704757, "percentage": 91.06, "elapsed_time": "16:29:53", "remaining_time": "1:37:11", "throughput": 3348.08, "total_tokens": 198853200} +{"current_steps": 163530, "total_steps": 179580, "loss": 0.4751, "lr": 1.2069441828024526e-06, "epoch": 18.212495823588373, "percentage": 91.06, "elapsed_time": "16:29:54", "remaining_time": "1:37:09", "throughput": 3348.09, "total_tokens": 198859536} +{"current_steps": 163535, "total_steps": 179580, "loss": 0.667, "lr": 1.206198461476668e-06, "epoch": 18.21305267847199, "percentage": 91.07, "elapsed_time": "16:29:56", "remaining_time": "1:37:07", "throughput": 3348.09, "total_tokens": 198865168} +{"current_steps": 163540, "total_steps": 179580, "loss": 0.7528, "lr": 1.2054529649024094e-06, "epoch": 18.21360953335561, "percentage": 91.07, "elapsed_time": "16:29:58", "remaining_time": "1:37:05", "throughput": 3348.09, "total_tokens": 198870608} +{"current_steps": 163545, "total_steps": 179580, "loss": 0.7156, "lr": 1.2047076930867014e-06, "epoch": 18.214166388239224, "percentage": 91.07, "elapsed_time": "16:30:00", "remaining_time": "1:37:03", "throughput": 3348.09, "total_tokens": 198877008} +{"current_steps": 163550, "total_steps": 179580, "loss": 0.561, "lr": 1.2039626460365993e-06, "epoch": 18.214723243122844, "percentage": 91.07, "elapsed_time": "16:30:01", "remaining_time": "1:37:02", "throughput": 3348.1, "total_tokens": 198882992} +{"current_steps": 163555, "total_steps": 179580, "loss": 1.2468, "lr": 1.2032178237591312e-06, "epoch": 18.21528009800646, "percentage": 91.08, "elapsed_time": "16:30:03", "remaining_time": "1:37:00", "throughput": 3348.1, "total_tokens": 198889104} +{"current_steps": 163560, "total_steps": 179580, "loss": 0.9569, "lr": 1.2024732262613414e-06, "epoch": 18.215836952890076, "percentage": 91.08, "elapsed_time": "16:30:05", "remaining_time": "1:36:58", "throughput": 3348.1, "total_tokens": 198895376} +{"current_steps": 163565, "total_steps": 179580, "loss": 0.7589, "lr": 1.2017288535502574e-06, "epoch": 18.216393807773695, "percentage": 91.08, "elapsed_time": "16:30:07", "remaining_time": "1:36:56", "throughput": 3348.11, "total_tokens": 198901232} +{"current_steps": 163570, "total_steps": 179580, "loss": 0.57, "lr": 1.20098470563291e-06, "epoch": 18.21695066265731, "percentage": 91.08, "elapsed_time": "16:30:08", "remaining_time": "1:36:54", "throughput": 3348.11, "total_tokens": 198907632} +{"current_steps": 163575, "total_steps": 179580, "loss": 0.9066, "lr": 1.2002407825163264e-06, "epoch": 18.21750751754093, "percentage": 91.09, "elapsed_time": "16:30:10", "remaining_time": "1:36:53", "throughput": 3348.12, "total_tokens": 198913648} +{"current_steps": 163580, "total_steps": 179580, "loss": 0.6146, "lr": 1.1994970842075404e-06, "epoch": 18.218064372424546, "percentage": 91.09, "elapsed_time": "16:30:12", "remaining_time": "1:36:51", "throughput": 3348.12, "total_tokens": 198919632} +{"current_steps": 163585, "total_steps": 179580, "loss": 0.6494, "lr": 1.198753610713574e-06, "epoch": 18.218621227308162, "percentage": 91.09, "elapsed_time": "16:30:14", "remaining_time": "1:36:49", "throughput": 3348.12, "total_tokens": 198925872} +{"current_steps": 163590, "total_steps": 179580, "loss": 0.8287, "lr": 1.198010362041449e-06, "epoch": 18.21917808219178, "percentage": 91.1, "elapsed_time": "16:30:15", "remaining_time": "1:36:47", "throughput": 3348.13, "total_tokens": 198931952} +{"current_steps": 163595, "total_steps": 179580, "loss": 0.8223, "lr": 1.1972673381981797e-06, "epoch": 18.219734937075398, "percentage": 91.1, "elapsed_time": "16:30:17", "remaining_time": "1:36:45", "throughput": 3348.13, "total_tokens": 198937904} +{"current_steps": 163600, "total_steps": 179580, "loss": 0.7547, "lr": 1.1965245391907964e-06, "epoch": 18.220291791959017, "percentage": 91.1, "elapsed_time": "16:30:19", "remaining_time": "1:36:43", "throughput": 3348.13, "total_tokens": 198944272} +{"current_steps": 163605, "total_steps": 179580, "loss": 0.6409, "lr": 1.1957819650263075e-06, "epoch": 18.220848646842633, "percentage": 91.1, "elapsed_time": "16:30:21", "remaining_time": "1:36:42", "throughput": 3348.14, "total_tokens": 198950416} +{"current_steps": 163610, "total_steps": 179580, "loss": 0.6448, "lr": 1.1950396157117322e-06, "epoch": 18.22140550172625, "percentage": 91.11, "elapsed_time": "16:30:23", "remaining_time": "1:36:40", "throughput": 3348.14, "total_tokens": 198956688} +{"current_steps": 163615, "total_steps": 179580, "loss": 0.6673, "lr": 1.1942974912540788e-06, "epoch": 18.22196235660987, "percentage": 91.11, "elapsed_time": "16:30:24", "remaining_time": "1:36:38", "throughput": 3348.15, "total_tokens": 198962960} +{"current_steps": 163620, "total_steps": 179580, "loss": 0.8964, "lr": 1.1935555916603586e-06, "epoch": 18.222519211493484, "percentage": 91.11, "elapsed_time": "16:30:26", "remaining_time": "1:36:36", "throughput": 3348.15, "total_tokens": 198969104} +{"current_steps": 163625, "total_steps": 179580, "loss": 0.9077, "lr": 1.1928139169375769e-06, "epoch": 18.223076066377104, "percentage": 91.12, "elapsed_time": "16:30:28", "remaining_time": "1:36:34", "throughput": 3348.15, "total_tokens": 198975376} +{"current_steps": 163630, "total_steps": 179580, "loss": 0.7601, "lr": 1.1920724670927448e-06, "epoch": 18.22363292126072, "percentage": 91.12, "elapsed_time": "16:30:30", "remaining_time": "1:36:33", "throughput": 3348.16, "total_tokens": 198981648} +{"current_steps": 163635, "total_steps": 179580, "loss": 0.6118, "lr": 1.1913312421328622e-06, "epoch": 18.224189776144335, "percentage": 91.12, "elapsed_time": "16:30:31", "remaining_time": "1:36:31", "throughput": 3348.16, "total_tokens": 198987728} +{"current_steps": 163640, "total_steps": 179580, "loss": 0.6723, "lr": 1.1905902420649317e-06, "epoch": 18.224746631027955, "percentage": 91.12, "elapsed_time": "16:30:33", "remaining_time": "1:36:29", "throughput": 3348.16, "total_tokens": 198993808} +{"current_steps": 163645, "total_steps": 179580, "loss": 0.6805, "lr": 1.1898494668959481e-06, "epoch": 18.22530348591157, "percentage": 91.13, "elapsed_time": "16:30:35", "remaining_time": "1:36:27", "throughput": 3348.17, "total_tokens": 198999984} +{"current_steps": 163650, "total_steps": 179580, "loss": 0.9083, "lr": 1.1891089166329167e-06, "epoch": 18.22586034079519, "percentage": 91.13, "elapsed_time": "16:30:37", "remaining_time": "1:36:25", "throughput": 3348.17, "total_tokens": 199005552} +{"current_steps": 163655, "total_steps": 179580, "loss": 0.7146, "lr": 1.1883685912828262e-06, "epoch": 18.226417195678806, "percentage": 91.13, "elapsed_time": "16:30:38", "remaining_time": "1:36:23", "throughput": 3348.17, "total_tokens": 199011536} +{"current_steps": 163660, "total_steps": 179580, "loss": 0.6197, "lr": 1.1876284908526768e-06, "epoch": 18.226974050562422, "percentage": 91.13, "elapsed_time": "16:30:40", "remaining_time": "1:36:22", "throughput": 3348.18, "total_tokens": 199017360} +{"current_steps": 163665, "total_steps": 179580, "loss": 0.6904, "lr": 1.186888615349449e-06, "epoch": 18.22753090544604, "percentage": 91.14, "elapsed_time": "16:30:42", "remaining_time": "1:36:20", "throughput": 3348.18, "total_tokens": 199023696} +{"current_steps": 163670, "total_steps": 179580, "loss": 0.7165, "lr": 1.18614896478014e-06, "epoch": 18.228087760329657, "percentage": 91.14, "elapsed_time": "16:30:44", "remaining_time": "1:36:18", "throughput": 3348.18, "total_tokens": 199029616} +{"current_steps": 163675, "total_steps": 179580, "loss": 0.5316, "lr": 1.18540953915173e-06, "epoch": 18.228644615213277, "percentage": 91.14, "elapsed_time": "16:30:45", "remaining_time": "1:36:16", "throughput": 3348.18, "total_tokens": 199035792} +{"current_steps": 163680, "total_steps": 179580, "loss": 0.837, "lr": 1.184670338471211e-06, "epoch": 18.229201470096893, "percentage": 91.15, "elapsed_time": "16:30:47", "remaining_time": "1:36:14", "throughput": 3348.19, "total_tokens": 199041616} +{"current_steps": 163685, "total_steps": 179580, "loss": 0.719, "lr": 1.1839313627455578e-06, "epoch": 18.22975832498051, "percentage": 91.15, "elapsed_time": "16:30:49", "remaining_time": "1:36:12", "throughput": 3348.19, "total_tokens": 199047760} +{"current_steps": 163690, "total_steps": 179580, "loss": 0.7311, "lr": 1.1831926119817567e-06, "epoch": 18.230315179864128, "percentage": 91.15, "elapsed_time": "16:30:51", "remaining_time": "1:36:11", "throughput": 3348.19, "total_tokens": 199053712} +{"current_steps": 163695, "total_steps": 179580, "loss": 0.5672, "lr": 1.1824540861867794e-06, "epoch": 18.230872034747744, "percentage": 91.15, "elapsed_time": "16:30:52", "remaining_time": "1:36:09", "throughput": 3348.2, "total_tokens": 199059984} +{"current_steps": 163700, "total_steps": 179580, "loss": 0.769, "lr": 1.1817157853676098e-06, "epoch": 18.231428889631363, "percentage": 91.16, "elapsed_time": "16:30:54", "remaining_time": "1:36:07", "throughput": 3348.2, "total_tokens": 199065904} +{"current_steps": 163705, "total_steps": 179580, "loss": 0.7821, "lr": 1.1809777095312169e-06, "epoch": 18.23198574451498, "percentage": 91.16, "elapsed_time": "16:30:56", "remaining_time": "1:36:05", "throughput": 3348.2, "total_tokens": 199072272} +{"current_steps": 163710, "total_steps": 179580, "loss": 0.8064, "lr": 1.1802398586845732e-06, "epoch": 18.232542599398595, "percentage": 91.16, "elapsed_time": "16:30:58", "remaining_time": "1:36:03", "throughput": 3348.21, "total_tokens": 199078512} +{"current_steps": 163715, "total_steps": 179580, "loss": 0.7234, "lr": 1.1795022328346478e-06, "epoch": 18.233099454282215, "percentage": 91.17, "elapsed_time": "16:31:00", "remaining_time": "1:36:02", "throughput": 3348.21, "total_tokens": 199084592} +{"current_steps": 163720, "total_steps": 179580, "loss": 0.5747, "lr": 1.178764831988405e-06, "epoch": 18.23365630916583, "percentage": 91.17, "elapsed_time": "16:31:01", "remaining_time": "1:36:00", "throughput": 3348.21, "total_tokens": 199090640} +{"current_steps": 163725, "total_steps": 179580, "loss": 0.6437, "lr": 1.1780276561528163e-06, "epoch": 18.23421316404945, "percentage": 91.17, "elapsed_time": "16:31:03", "remaining_time": "1:35:58", "throughput": 3348.22, "total_tokens": 199096816} +{"current_steps": 163730, "total_steps": 179580, "loss": 0.5676, "lr": 1.1772907053348436e-06, "epoch": 18.234770018933066, "percentage": 91.17, "elapsed_time": "16:31:05", "remaining_time": "1:35:56", "throughput": 3348.22, "total_tokens": 199102608} +{"current_steps": 163735, "total_steps": 179580, "loss": 0.7972, "lr": 1.1765539795414448e-06, "epoch": 18.235326873816682, "percentage": 91.18, "elapsed_time": "16:31:07", "remaining_time": "1:35:54", "throughput": 3348.22, "total_tokens": 199108976} +{"current_steps": 163740, "total_steps": 179580, "loss": 0.5991, "lr": 1.1758174787795783e-06, "epoch": 18.2358837287003, "percentage": 91.18, "elapsed_time": "16:31:08", "remaining_time": "1:35:52", "throughput": 3348.23, "total_tokens": 199115248} +{"current_steps": 163745, "total_steps": 179580, "loss": 0.8018, "lr": 1.1750812030562081e-06, "epoch": 18.236440583583917, "percentage": 91.18, "elapsed_time": "16:31:10", "remaining_time": "1:35:51", "throughput": 3348.23, "total_tokens": 199121136} +{"current_steps": 163750, "total_steps": 179580, "loss": 0.7374, "lr": 1.1743451523782784e-06, "epoch": 18.236997438467537, "percentage": 91.18, "elapsed_time": "16:31:12", "remaining_time": "1:35:49", "throughput": 3348.23, "total_tokens": 199127216} +{"current_steps": 163755, "total_steps": 179580, "loss": 0.8647, "lr": 1.1736093267527531e-06, "epoch": 18.237554293351153, "percentage": 91.19, "elapsed_time": "16:31:14", "remaining_time": "1:35:47", "throughput": 3348.24, "total_tokens": 199133072} +{"current_steps": 163760, "total_steps": 179580, "loss": 0.6413, "lr": 1.1728737261865768e-06, "epoch": 18.23811114823477, "percentage": 91.19, "elapsed_time": "16:31:15", "remaining_time": "1:35:45", "throughput": 3348.24, "total_tokens": 199138800} +{"current_steps": 163765, "total_steps": 179580, "loss": 0.5484, "lr": 1.1721383506866968e-06, "epoch": 18.238668003118388, "percentage": 91.19, "elapsed_time": "16:31:17", "remaining_time": "1:35:43", "throughput": 3348.24, "total_tokens": 199144304} +{"current_steps": 163770, "total_steps": 179580, "loss": 0.774, "lr": 1.1714032002600572e-06, "epoch": 18.239224858002004, "percentage": 91.2, "elapsed_time": "16:31:19", "remaining_time": "1:35:41", "throughput": 3348.24, "total_tokens": 199150544} +{"current_steps": 163775, "total_steps": 179580, "loss": 0.6209, "lr": 1.170668274913611e-06, "epoch": 18.239781712885623, "percentage": 91.2, "elapsed_time": "16:31:20", "remaining_time": "1:35:40", "throughput": 3348.25, "total_tokens": 199156624} +{"current_steps": 163780, "total_steps": 179580, "loss": 0.9977, "lr": 1.1699335746542917e-06, "epoch": 18.24033856776924, "percentage": 91.2, "elapsed_time": "16:31:22", "remaining_time": "1:35:38", "throughput": 3348.25, "total_tokens": 199162096} +{"current_steps": 163785, "total_steps": 179580, "loss": 0.6952, "lr": 1.1691990994890433e-06, "epoch": 18.240895422652855, "percentage": 91.2, "elapsed_time": "16:31:24", "remaining_time": "1:35:36", "throughput": 3348.25, "total_tokens": 199168464} +{"current_steps": 163790, "total_steps": 179580, "loss": 0.4478, "lr": 1.1684648494247997e-06, "epoch": 18.241452277536474, "percentage": 91.21, "elapsed_time": "16:31:26", "remaining_time": "1:35:34", "throughput": 3348.25, "total_tokens": 199174352} +{"current_steps": 163795, "total_steps": 179580, "loss": 0.6546, "lr": 1.167730824468502e-06, "epoch": 18.24200913242009, "percentage": 91.21, "elapsed_time": "16:31:27", "remaining_time": "1:35:32", "throughput": 3348.26, "total_tokens": 199180432} +{"current_steps": 163800, "total_steps": 179580, "loss": 0.6554, "lr": 1.1669970246270784e-06, "epoch": 18.24256598730371, "percentage": 91.21, "elapsed_time": "16:31:29", "remaining_time": "1:35:31", "throughput": 3348.26, "total_tokens": 199186512} +{"current_steps": 163805, "total_steps": 179580, "loss": 0.6345, "lr": 1.1662634499074675e-06, "epoch": 18.243122842187326, "percentage": 91.22, "elapsed_time": "16:31:31", "remaining_time": "1:35:29", "throughput": 3348.27, "total_tokens": 199192496} +{"current_steps": 163810, "total_steps": 179580, "loss": 0.763, "lr": 1.1655301003165892e-06, "epoch": 18.24367969707094, "percentage": 91.22, "elapsed_time": "16:31:33", "remaining_time": "1:35:27", "throughput": 3348.27, "total_tokens": 199198576} +{"current_steps": 163815, "total_steps": 179580, "loss": 0.5177, "lr": 1.1647969758613764e-06, "epoch": 18.24423655195456, "percentage": 91.22, "elapsed_time": "16:31:34", "remaining_time": "1:35:25", "throughput": 3348.27, "total_tokens": 199205008} +{"current_steps": 163820, "total_steps": 179580, "loss": 0.7089, "lr": 1.1640640765487487e-06, "epoch": 18.244793406838177, "percentage": 91.22, "elapsed_time": "16:31:36", "remaining_time": "1:35:23", "throughput": 3348.27, "total_tokens": 199210928} +{"current_steps": 163825, "total_steps": 179580, "loss": 0.646, "lr": 1.1633314023856367e-06, "epoch": 18.245350261721796, "percentage": 91.23, "elapsed_time": "16:31:38", "remaining_time": "1:35:21", "throughput": 3348.28, "total_tokens": 199217488} +{"current_steps": 163830, "total_steps": 179580, "loss": 0.7775, "lr": 1.16259895337896e-06, "epoch": 18.245907116605412, "percentage": 91.23, "elapsed_time": "16:31:40", "remaining_time": "1:35:20", "throughput": 3348.28, "total_tokens": 199223920} +{"current_steps": 163835, "total_steps": 179580, "loss": 0.6526, "lr": 1.1618667295356295e-06, "epoch": 18.246463971489028, "percentage": 91.23, "elapsed_time": "16:31:42", "remaining_time": "1:35:18", "throughput": 3348.28, "total_tokens": 199230000} +{"current_steps": 163840, "total_steps": 179580, "loss": 0.6451, "lr": 1.1611347308625675e-06, "epoch": 18.247020826372648, "percentage": 91.24, "elapsed_time": "16:31:43", "remaining_time": "1:35:16", "throughput": 3348.29, "total_tokens": 199235952} +{"current_steps": 163845, "total_steps": 179580, "loss": 0.8129, "lr": 1.160402957366688e-06, "epoch": 18.247577681256264, "percentage": 91.24, "elapsed_time": "16:31:45", "remaining_time": "1:35:14", "throughput": 3348.29, "total_tokens": 199242064} +{"current_steps": 163850, "total_steps": 179580, "loss": 0.8033, "lr": 1.159671409054905e-06, "epoch": 18.248134536139883, "percentage": 91.24, "elapsed_time": "16:31:47", "remaining_time": "1:35:12", "throughput": 3348.29, "total_tokens": 199248112} +{"current_steps": 163855, "total_steps": 179580, "loss": 0.6251, "lr": 1.1589400859341237e-06, "epoch": 18.2486913910235, "percentage": 91.24, "elapsed_time": "16:31:49", "remaining_time": "1:35:11", "throughput": 3348.3, "total_tokens": 199254256} +{"current_steps": 163860, "total_steps": 179580, "loss": 0.6779, "lr": 1.1582089880112528e-06, "epoch": 18.24924824590712, "percentage": 91.25, "elapsed_time": "16:31:50", "remaining_time": "1:35:09", "throughput": 3348.3, "total_tokens": 199260560} +{"current_steps": 163865, "total_steps": 179580, "loss": 0.784, "lr": 1.1574781152932007e-06, "epoch": 18.249805100790734, "percentage": 91.25, "elapsed_time": "16:31:52", "remaining_time": "1:35:07", "throughput": 3348.31, "total_tokens": 199266160} +{"current_steps": 163870, "total_steps": 179580, "loss": 0.7349, "lr": 1.15674746778687e-06, "epoch": 18.25036195567435, "percentage": 91.25, "elapsed_time": "16:31:54", "remaining_time": "1:35:05", "throughput": 3348.31, "total_tokens": 199272432} +{"current_steps": 163875, "total_steps": 179580, "loss": 0.6538, "lr": 1.1560170454991664e-06, "epoch": 18.25091881055797, "percentage": 91.25, "elapsed_time": "16:31:56", "remaining_time": "1:35:03", "throughput": 3348.31, "total_tokens": 199278352} +{"current_steps": 163880, "total_steps": 179580, "loss": 0.5685, "lr": 1.155286848436979e-06, "epoch": 18.251475665441586, "percentage": 91.26, "elapsed_time": "16:31:57", "remaining_time": "1:35:01", "throughput": 3348.32, "total_tokens": 199284560} +{"current_steps": 163885, "total_steps": 179580, "loss": 0.7325, "lr": 1.1545568766072157e-06, "epoch": 18.252032520325205, "percentage": 91.26, "elapsed_time": "16:31:59", "remaining_time": "1:35:00", "throughput": 3348.32, "total_tokens": 199290672} +{"current_steps": 163890, "total_steps": 179580, "loss": 0.6039, "lr": 1.153827130016763e-06, "epoch": 18.25258937520882, "percentage": 91.26, "elapsed_time": "16:32:01", "remaining_time": "1:34:58", "throughput": 3348.32, "total_tokens": 199296784} +{"current_steps": 163895, "total_steps": 179580, "loss": 0.6136, "lr": 1.1530976086725236e-06, "epoch": 18.253146230092437, "percentage": 91.27, "elapsed_time": "16:32:03", "remaining_time": "1:34:56", "throughput": 3348.33, "total_tokens": 199302704} +{"current_steps": 163900, "total_steps": 179580, "loss": 0.6271, "lr": 1.1523683125813812e-06, "epoch": 18.253703084976056, "percentage": 91.27, "elapsed_time": "16:32:04", "remaining_time": "1:34:54", "throughput": 3348.33, "total_tokens": 199308816} +{"current_steps": 163905, "total_steps": 179580, "loss": 0.7205, "lr": 1.1516392417502269e-06, "epoch": 18.254259939859672, "percentage": 91.27, "elapsed_time": "16:32:06", "remaining_time": "1:34:52", "throughput": 3348.33, "total_tokens": 199314992} +{"current_steps": 163910, "total_steps": 179580, "loss": 0.7829, "lr": 1.1509103961859446e-06, "epoch": 18.25481679474329, "percentage": 91.27, "elapsed_time": "16:32:08", "remaining_time": "1:34:50", "throughput": 3348.34, "total_tokens": 199320976} +{"current_steps": 163915, "total_steps": 179580, "loss": 0.702, "lr": 1.1501817758954232e-06, "epoch": 18.255373649626907, "percentage": 91.28, "elapsed_time": "16:32:10", "remaining_time": "1:34:49", "throughput": 3348.34, "total_tokens": 199326928} +{"current_steps": 163920, "total_steps": 179580, "loss": 0.8042, "lr": 1.149453380885543e-06, "epoch": 18.255930504510523, "percentage": 91.28, "elapsed_time": "16:32:11", "remaining_time": "1:34:47", "throughput": 3348.34, "total_tokens": 199333232} +{"current_steps": 163925, "total_steps": 179580, "loss": 0.8929, "lr": 1.1487252111631847e-06, "epoch": 18.256487359394143, "percentage": 91.28, "elapsed_time": "16:32:13", "remaining_time": "1:34:45", "throughput": 3348.35, "total_tokens": 199339600} +{"current_steps": 163930, "total_steps": 179580, "loss": 0.8474, "lr": 1.1479972667352234e-06, "epoch": 18.25704421427776, "percentage": 91.29, "elapsed_time": "16:32:15", "remaining_time": "1:34:43", "throughput": 3348.35, "total_tokens": 199345360} +{"current_steps": 163935, "total_steps": 179580, "loss": 0.5285, "lr": 1.1472695476085427e-06, "epoch": 18.257601069161378, "percentage": 91.29, "elapsed_time": "16:32:17", "remaining_time": "1:34:41", "throughput": 3348.35, "total_tokens": 199351984} +{"current_steps": 163940, "total_steps": 179580, "loss": 0.6999, "lr": 1.1465420537900062e-06, "epoch": 18.258157924044994, "percentage": 91.29, "elapsed_time": "16:32:19", "remaining_time": "1:34:40", "throughput": 3348.36, "total_tokens": 199358224} +{"current_steps": 163945, "total_steps": 179580, "loss": 0.7152, "lr": 1.1458147852864975e-06, "epoch": 18.25871477892861, "percentage": 91.29, "elapsed_time": "16:32:20", "remaining_time": "1:34:38", "throughput": 3348.36, "total_tokens": 199364336} +{"current_steps": 163950, "total_steps": 179580, "loss": 0.751, "lr": 1.1450877421048723e-06, "epoch": 18.25927163381223, "percentage": 91.3, "elapsed_time": "16:32:22", "remaining_time": "1:34:36", "throughput": 3348.36, "total_tokens": 199370384} +{"current_steps": 163955, "total_steps": 179580, "loss": 0.6074, "lr": 1.1443609242520109e-06, "epoch": 18.259828488695845, "percentage": 91.3, "elapsed_time": "16:32:24", "remaining_time": "1:34:34", "throughput": 3348.37, "total_tokens": 199376528} +{"current_steps": 163960, "total_steps": 179580, "loss": 0.7532, "lr": 1.1436343317347692e-06, "epoch": 18.260385343579465, "percentage": 91.3, "elapsed_time": "16:32:26", "remaining_time": "1:34:32", "throughput": 3348.37, "total_tokens": 199382096} +{"current_steps": 163965, "total_steps": 179580, "loss": 0.992, "lr": 1.1429079645600167e-06, "epoch": 18.26094219846308, "percentage": 91.3, "elapsed_time": "16:32:27", "remaining_time": "1:34:30", "throughput": 3348.37, "total_tokens": 199388240} +{"current_steps": 163970, "total_steps": 179580, "loss": 0.7799, "lr": 1.1421818227346143e-06, "epoch": 18.261499053346697, "percentage": 91.31, "elapsed_time": "16:32:29", "remaining_time": "1:34:29", "throughput": 3348.37, "total_tokens": 199393776} +{"current_steps": 163975, "total_steps": 179580, "loss": 0.6874, "lr": 1.1414559062654207e-06, "epoch": 18.262055908230316, "percentage": 91.31, "elapsed_time": "16:32:31", "remaining_time": "1:34:27", "throughput": 3348.38, "total_tokens": 199399920} +{"current_steps": 163980, "total_steps": 179580, "loss": 0.9294, "lr": 1.1407302151592858e-06, "epoch": 18.262612763113932, "percentage": 91.31, "elapsed_time": "16:32:32", "remaining_time": "1:34:25", "throughput": 3348.38, "total_tokens": 199406000} +{"current_steps": 163985, "total_steps": 179580, "loss": 1.2315, "lr": 1.140004749423071e-06, "epoch": 18.26316961799755, "percentage": 91.32, "elapsed_time": "16:32:34", "remaining_time": "1:34:23", "throughput": 3348.38, "total_tokens": 199411216} +{"current_steps": 163990, "total_steps": 179580, "loss": 0.607, "lr": 1.1392795090636316e-06, "epoch": 18.263726472881167, "percentage": 91.32, "elapsed_time": "16:32:36", "remaining_time": "1:34:21", "throughput": 3348.38, "total_tokens": 199416976} +{"current_steps": 163995, "total_steps": 179580, "loss": 0.6906, "lr": 1.1385544940878124e-06, "epoch": 18.264283327764783, "percentage": 91.32, "elapsed_time": "16:32:38", "remaining_time": "1:34:19", "throughput": 3348.38, "total_tokens": 199423088} +{"current_steps": 164000, "total_steps": 179580, "loss": 1.0436, "lr": 1.1378297045024605e-06, "epoch": 18.264840182648403, "percentage": 91.32, "elapsed_time": "16:32:39", "remaining_time": "1:34:18", "throughput": 3348.39, "total_tokens": 199429136} +{"current_steps": 164005, "total_steps": 179580, "loss": 0.5821, "lr": 1.1371051403144261e-06, "epoch": 18.26539703753202, "percentage": 91.33, "elapsed_time": "16:32:41", "remaining_time": "1:34:16", "throughput": 3348.39, "total_tokens": 199435120} +{"current_steps": 164010, "total_steps": 179580, "loss": 0.7401, "lr": 1.1363808015305511e-06, "epoch": 18.265953892415638, "percentage": 91.33, "elapsed_time": "16:32:43", "remaining_time": "1:34:14", "throughput": 3348.39, "total_tokens": 199441168} +{"current_steps": 164015, "total_steps": 179580, "loss": 0.5937, "lr": 1.1356566881576824e-06, "epoch": 18.266510747299254, "percentage": 91.33, "elapsed_time": "16:32:45", "remaining_time": "1:34:12", "throughput": 3348.4, "total_tokens": 199447248} +{"current_steps": 164020, "total_steps": 179580, "loss": 0.6174, "lr": 1.1349328002026566e-06, "epoch": 18.26706760218287, "percentage": 91.34, "elapsed_time": "16:32:46", "remaining_time": "1:34:10", "throughput": 3348.4, "total_tokens": 199453136} +{"current_steps": 164025, "total_steps": 179580, "loss": 0.4045, "lr": 1.1342091376723096e-06, "epoch": 18.26762445706649, "percentage": 91.34, "elapsed_time": "16:32:48", "remaining_time": "1:34:09", "throughput": 3348.4, "total_tokens": 199459152} +{"current_steps": 164030, "total_steps": 179580, "loss": 0.8555, "lr": 1.133485700573475e-06, "epoch": 18.268181311950105, "percentage": 91.34, "elapsed_time": "16:32:50", "remaining_time": "1:34:07", "throughput": 3348.41, "total_tokens": 199465488} +{"current_steps": 164035, "total_steps": 179580, "loss": 1.1139, "lr": 1.1327624889129917e-06, "epoch": 18.268738166833725, "percentage": 91.34, "elapsed_time": "16:32:51", "remaining_time": "1:34:05", "throughput": 3348.41, "total_tokens": 199471664} +{"current_steps": 164040, "total_steps": 179580, "loss": 0.641, "lr": 1.1320395026976905e-06, "epoch": 18.26929502171734, "percentage": 91.35, "elapsed_time": "16:32:53", "remaining_time": "1:34:03", "throughput": 3348.42, "total_tokens": 199478032} +{"current_steps": 164045, "total_steps": 179580, "loss": 0.7252, "lr": 1.1313167419343963e-06, "epoch": 18.269851876600956, "percentage": 91.35, "elapsed_time": "16:32:55", "remaining_time": "1:34:01", "throughput": 3348.42, "total_tokens": 199483856} +{"current_steps": 164050, "total_steps": 179580, "loss": 0.6148, "lr": 1.1305942066299396e-06, "epoch": 18.270408731484576, "percentage": 91.35, "elapsed_time": "16:32:57", "remaining_time": "1:33:59", "throughput": 3348.42, "total_tokens": 199489744} +{"current_steps": 164055, "total_steps": 179580, "loss": 0.8609, "lr": 1.1298718967911458e-06, "epoch": 18.27096558636819, "percentage": 91.35, "elapsed_time": "16:32:58", "remaining_time": "1:33:58", "throughput": 3348.43, "total_tokens": 199495760} +{"current_steps": 164060, "total_steps": 179580, "loss": 0.6478, "lr": 1.1291498124248317e-06, "epoch": 18.27152244125181, "percentage": 91.36, "elapsed_time": "16:33:00", "remaining_time": "1:33:56", "throughput": 3348.43, "total_tokens": 199501584} +{"current_steps": 164065, "total_steps": 179580, "loss": 0.5997, "lr": 1.1284279535378305e-06, "epoch": 18.272079296135427, "percentage": 91.36, "elapsed_time": "16:33:02", "remaining_time": "1:33:54", "throughput": 3348.43, "total_tokens": 199507760} +{"current_steps": 164070, "total_steps": 179580, "loss": 0.5672, "lr": 1.1277063201369454e-06, "epoch": 18.272636151019043, "percentage": 91.36, "elapsed_time": "16:33:04", "remaining_time": "1:33:52", "throughput": 3348.44, "total_tokens": 199513808} +{"current_steps": 164075, "total_steps": 179580, "loss": 0.6571, "lr": 1.126984912229004e-06, "epoch": 18.273193005902662, "percentage": 91.37, "elapsed_time": "16:33:05", "remaining_time": "1:33:50", "throughput": 3348.44, "total_tokens": 199519824} +{"current_steps": 164080, "total_steps": 179580, "loss": 0.745, "lr": 1.1262637298208145e-06, "epoch": 18.27374986078628, "percentage": 91.37, "elapsed_time": "16:33:07", "remaining_time": "1:33:49", "throughput": 3348.44, "total_tokens": 199525808} +{"current_steps": 164085, "total_steps": 179580, "loss": 0.8833, "lr": 1.1255427729191942e-06, "epoch": 18.274306715669898, "percentage": 91.37, "elapsed_time": "16:33:09", "remaining_time": "1:33:47", "throughput": 3348.44, "total_tokens": 199531568} +{"current_steps": 164090, "total_steps": 179580, "loss": 0.9616, "lr": 1.1248220415309512e-06, "epoch": 18.274863570553514, "percentage": 91.37, "elapsed_time": "16:33:10", "remaining_time": "1:33:45", "throughput": 3348.45, "total_tokens": 199537232} +{"current_steps": 164095, "total_steps": 179580, "loss": 0.7364, "lr": 1.1241015356628915e-06, "epoch": 18.27542042543713, "percentage": 91.38, "elapsed_time": "16:33:12", "remaining_time": "1:33:43", "throughput": 3348.45, "total_tokens": 199543504} +{"current_steps": 164100, "total_steps": 179580, "loss": 0.6721, "lr": 1.1233812553218177e-06, "epoch": 18.27597728032075, "percentage": 91.38, "elapsed_time": "16:33:14", "remaining_time": "1:33:41", "throughput": 3348.45, "total_tokens": 199549520} +{"current_steps": 164105, "total_steps": 179580, "loss": 0.5687, "lr": 1.1226612005145409e-06, "epoch": 18.276534135204365, "percentage": 91.38, "elapsed_time": "16:33:16", "remaining_time": "1:33:39", "throughput": 3348.46, "total_tokens": 199555536} +{"current_steps": 164110, "total_steps": 179580, "loss": 0.8696, "lr": 1.1219413712478616e-06, "epoch": 18.277090990087984, "percentage": 91.39, "elapsed_time": "16:33:17", "remaining_time": "1:33:38", "throughput": 3348.46, "total_tokens": 199560912} +{"current_steps": 164115, "total_steps": 179580, "loss": 0.4967, "lr": 1.121221767528574e-06, "epoch": 18.2776478449716, "percentage": 91.39, "elapsed_time": "16:33:19", "remaining_time": "1:33:36", "throughput": 3348.46, "total_tokens": 199567280} +{"current_steps": 164120, "total_steps": 179580, "loss": 0.8112, "lr": 1.1205023893634758e-06, "epoch": 18.278204699855216, "percentage": 91.39, "elapsed_time": "16:33:21", "remaining_time": "1:33:34", "throughput": 3348.46, "total_tokens": 199573008} +{"current_steps": 164125, "total_steps": 179580, "loss": 0.5734, "lr": 1.1197832367593697e-06, "epoch": 18.278761554738836, "percentage": 91.39, "elapsed_time": "16:33:23", "remaining_time": "1:33:32", "throughput": 3348.47, "total_tokens": 199579248} +{"current_steps": 164130, "total_steps": 179580, "loss": 0.8097, "lr": 1.119064309723042e-06, "epoch": 18.27931840962245, "percentage": 91.4, "elapsed_time": "16:33:24", "remaining_time": "1:33:30", "throughput": 3348.47, "total_tokens": 199585328} +{"current_steps": 164135, "total_steps": 179580, "loss": 0.5328, "lr": 1.1183456082612843e-06, "epoch": 18.27987526450607, "percentage": 91.4, "elapsed_time": "16:33:26", "remaining_time": "1:33:28", "throughput": 3348.48, "total_tokens": 199591088} +{"current_steps": 164140, "total_steps": 179580, "loss": 0.7231, "lr": 1.1176271323808856e-06, "epoch": 18.280432119389687, "percentage": 91.4, "elapsed_time": "16:33:28", "remaining_time": "1:33:27", "throughput": 3348.48, "total_tokens": 199597200} +{"current_steps": 164145, "total_steps": 179580, "loss": 0.8, "lr": 1.1169088820886298e-06, "epoch": 18.280988974273303, "percentage": 91.4, "elapsed_time": "16:33:30", "remaining_time": "1:33:25", "throughput": 3348.48, "total_tokens": 199603344} +{"current_steps": 164150, "total_steps": 179580, "loss": 0.8344, "lr": 1.116190857391311e-06, "epoch": 18.281545829156922, "percentage": 91.41, "elapsed_time": "16:33:31", "remaining_time": "1:33:23", "throughput": 3348.48, "total_tokens": 199609328} +{"current_steps": 164155, "total_steps": 179580, "loss": 0.5266, "lr": 1.115473058295699e-06, "epoch": 18.282102684040538, "percentage": 91.41, "elapsed_time": "16:33:33", "remaining_time": "1:33:21", "throughput": 3348.49, "total_tokens": 199615632} +{"current_steps": 164160, "total_steps": 179580, "loss": 0.7556, "lr": 1.114755484808583e-06, "epoch": 18.282659538924158, "percentage": 91.41, "elapsed_time": "16:33:35", "remaining_time": "1:33:19", "throughput": 3348.49, "total_tokens": 199621904} +{"current_steps": 164165, "total_steps": 179580, "loss": 0.6686, "lr": 1.1140381369367374e-06, "epoch": 18.283216393807773, "percentage": 91.42, "elapsed_time": "16:33:37", "remaining_time": "1:33:18", "throughput": 3348.5, "total_tokens": 199628016} +{"current_steps": 164170, "total_steps": 179580, "loss": 0.6134, "lr": 1.1133210146869382e-06, "epoch": 18.28377324869139, "percentage": 91.42, "elapsed_time": "16:33:38", "remaining_time": "1:33:16", "throughput": 3348.5, "total_tokens": 199634160} +{"current_steps": 164175, "total_steps": 179580, "loss": 0.5489, "lr": 1.1126041180659602e-06, "epoch": 18.28433010357501, "percentage": 91.42, "elapsed_time": "16:33:40", "remaining_time": "1:33:14", "throughput": 3348.51, "total_tokens": 199640176} +{"current_steps": 164180, "total_steps": 179580, "loss": 0.6932, "lr": 1.1118874470805757e-06, "epoch": 18.284886958458625, "percentage": 91.42, "elapsed_time": "16:33:42", "remaining_time": "1:33:12", "throughput": 3348.51, "total_tokens": 199646288} +{"current_steps": 164185, "total_steps": 179580, "loss": 0.9667, "lr": 1.1111710017375516e-06, "epoch": 18.285443813342244, "percentage": 91.43, "elapsed_time": "16:33:44", "remaining_time": "1:33:10", "throughput": 3348.51, "total_tokens": 199652464} +{"current_steps": 164190, "total_steps": 179580, "loss": 0.9172, "lr": 1.1104547820436572e-06, "epoch": 18.28600066822586, "percentage": 91.43, "elapsed_time": "16:33:45", "remaining_time": "1:33:08", "throughput": 3348.52, "total_tokens": 199658256} +{"current_steps": 164195, "total_steps": 179580, "loss": 0.5834, "lr": 1.109738788005657e-06, "epoch": 18.28655752310948, "percentage": 91.43, "elapsed_time": "16:33:47", "remaining_time": "1:33:07", "throughput": 3348.52, "total_tokens": 199664688} +{"current_steps": 164200, "total_steps": 179580, "loss": 0.9198, "lr": 1.1090230196303148e-06, "epoch": 18.287114377993095, "percentage": 91.44, "elapsed_time": "16:33:49", "remaining_time": "1:33:05", "throughput": 3348.53, "total_tokens": 199671056} +{"current_steps": 164205, "total_steps": 179580, "loss": 0.8431, "lr": 1.108307476924389e-06, "epoch": 18.28767123287671, "percentage": 91.44, "elapsed_time": "16:33:51", "remaining_time": "1:33:03", "throughput": 3348.53, "total_tokens": 199677296} +{"current_steps": 164210, "total_steps": 179580, "loss": 0.8249, "lr": 1.1075921598946464e-06, "epoch": 18.28822808776033, "percentage": 91.44, "elapsed_time": "16:33:53", "remaining_time": "1:33:01", "throughput": 3348.53, "total_tokens": 199683568} +{"current_steps": 164215, "total_steps": 179580, "loss": 0.9149, "lr": 1.1068770685478319e-06, "epoch": 18.288784942643947, "percentage": 91.44, "elapsed_time": "16:33:54", "remaining_time": "1:32:59", "throughput": 3348.54, "total_tokens": 199689840} +{"current_steps": 164220, "total_steps": 179580, "loss": 0.6949, "lr": 1.106162202890712e-06, "epoch": 18.289341797527566, "percentage": 91.45, "elapsed_time": "16:33:56", "remaining_time": "1:32:58", "throughput": 3348.54, "total_tokens": 199695824} +{"current_steps": 164225, "total_steps": 179580, "loss": 0.6194, "lr": 1.1054475629300286e-06, "epoch": 18.289898652411182, "percentage": 91.45, "elapsed_time": "16:33:58", "remaining_time": "1:32:56", "throughput": 3348.54, "total_tokens": 199701968} +{"current_steps": 164230, "total_steps": 179580, "loss": 0.6854, "lr": 1.1047331486725405e-06, "epoch": 18.290455507294798, "percentage": 91.45, "elapsed_time": "16:34:00", "remaining_time": "1:32:54", "throughput": 3348.55, "total_tokens": 199708592} +{"current_steps": 164235, "total_steps": 179580, "loss": 0.7949, "lr": 1.1040189601249917e-06, "epoch": 18.291012362178417, "percentage": 91.46, "elapsed_time": "16:34:02", "remaining_time": "1:32:52", "throughput": 3348.55, "total_tokens": 199714512} +{"current_steps": 164240, "total_steps": 179580, "loss": 0.8255, "lr": 1.1033049972941272e-06, "epoch": 18.291569217062033, "percentage": 91.46, "elapsed_time": "16:34:03", "remaining_time": "1:32:50", "throughput": 3348.56, "total_tokens": 199720592} +{"current_steps": 164245, "total_steps": 179580, "loss": 0.8276, "lr": 1.1025912601866917e-06, "epoch": 18.292126071945653, "percentage": 91.46, "elapsed_time": "16:34:05", "remaining_time": "1:32:48", "throughput": 3348.56, "total_tokens": 199726416} +{"current_steps": 164250, "total_steps": 179580, "loss": 0.8338, "lr": 1.1018777488094323e-06, "epoch": 18.29268292682927, "percentage": 91.46, "elapsed_time": "16:34:07", "remaining_time": "1:32:47", "throughput": 3348.56, "total_tokens": 199732464} +{"current_steps": 164255, "total_steps": 179580, "loss": 0.8728, "lr": 1.1011644631690827e-06, "epoch": 18.293239781712884, "percentage": 91.47, "elapsed_time": "16:34:09", "remaining_time": "1:32:45", "throughput": 3348.56, "total_tokens": 199738544} +{"current_steps": 164260, "total_steps": 179580, "loss": 0.8717, "lr": 1.1004514032723818e-06, "epoch": 18.293796636596504, "percentage": 91.47, "elapsed_time": "16:34:10", "remaining_time": "1:32:43", "throughput": 3348.57, "total_tokens": 199744848} +{"current_steps": 164265, "total_steps": 179580, "loss": 0.6667, "lr": 1.0997385691260631e-06, "epoch": 18.29435349148012, "percentage": 91.47, "elapsed_time": "16:34:12", "remaining_time": "1:32:41", "throughput": 3348.57, "total_tokens": 199750256} +{"current_steps": 164270, "total_steps": 179580, "loss": 0.8287, "lr": 1.0990259607368659e-06, "epoch": 18.29491034636374, "percentage": 91.47, "elapsed_time": "16:34:14", "remaining_time": "1:32:39", "throughput": 3348.57, "total_tokens": 199756528} +{"current_steps": 164275, "total_steps": 179580, "loss": 0.623, "lr": 1.0983135781115151e-06, "epoch": 18.295467201247355, "percentage": 91.48, "elapsed_time": "16:34:16", "remaining_time": "1:32:37", "throughput": 3348.58, "total_tokens": 199762864} +{"current_steps": 164280, "total_steps": 179580, "loss": 0.7724, "lr": 1.097601421256747e-06, "epoch": 18.29602405613097, "percentage": 91.48, "elapsed_time": "16:34:17", "remaining_time": "1:32:36", "throughput": 3348.58, "total_tokens": 199768944} +{"current_steps": 164285, "total_steps": 179580, "loss": 0.6946, "lr": 1.0968894901792758e-06, "epoch": 18.29658091101459, "percentage": 91.48, "elapsed_time": "16:34:19", "remaining_time": "1:32:34", "throughput": 3348.59, "total_tokens": 199775312} +{"current_steps": 164290, "total_steps": 179580, "loss": 0.7863, "lr": 1.0961777848858407e-06, "epoch": 18.297137765898206, "percentage": 91.49, "elapsed_time": "16:34:21", "remaining_time": "1:32:32", "throughput": 3348.59, "total_tokens": 199781488} +{"current_steps": 164295, "total_steps": 179580, "loss": 0.6591, "lr": 1.0954663053831526e-06, "epoch": 18.297694620781826, "percentage": 91.49, "elapsed_time": "16:34:23", "remaining_time": "1:32:30", "throughput": 3348.59, "total_tokens": 199787440} +{"current_steps": 164300, "total_steps": 179580, "loss": 0.7668, "lr": 1.0947550516779425e-06, "epoch": 18.29825147566544, "percentage": 91.49, "elapsed_time": "16:34:24", "remaining_time": "1:32:28", "throughput": 3348.6, "total_tokens": 199793488} +{"current_steps": 164305, "total_steps": 179580, "loss": 0.9008, "lr": 1.0940440237769217e-06, "epoch": 18.298808330549058, "percentage": 91.49, "elapsed_time": "16:34:26", "remaining_time": "1:32:27", "throughput": 3348.6, "total_tokens": 199799696} +{"current_steps": 164310, "total_steps": 179580, "loss": 0.671, "lr": 1.093333221686807e-06, "epoch": 18.299365185432677, "percentage": 91.5, "elapsed_time": "16:34:28", "remaining_time": "1:32:25", "throughput": 3348.6, "total_tokens": 199805744} +{"current_steps": 164315, "total_steps": 179580, "loss": 0.6845, "lr": 1.0926226454143124e-06, "epoch": 18.299922040316293, "percentage": 91.5, "elapsed_time": "16:34:30", "remaining_time": "1:32:23", "throughput": 3348.61, "total_tokens": 199811920} +{"current_steps": 164320, "total_steps": 179580, "loss": 0.6234, "lr": 1.0919122949661548e-06, "epoch": 18.300478895199912, "percentage": 91.5, "elapsed_time": "16:34:31", "remaining_time": "1:32:21", "throughput": 3348.61, "total_tokens": 199817968} +{"current_steps": 164325, "total_steps": 179580, "loss": 0.9589, "lr": 1.09120217034904e-06, "epoch": 18.30103575008353, "percentage": 91.51, "elapsed_time": "16:34:33", "remaining_time": "1:32:19", "throughput": 3348.61, "total_tokens": 199824016} +{"current_steps": 164330, "total_steps": 179580, "loss": 0.5381, "lr": 1.0904922715696765e-06, "epoch": 18.301592604967144, "percentage": 91.51, "elapsed_time": "16:34:35", "remaining_time": "1:32:17", "throughput": 3348.61, "total_tokens": 199829808} +{"current_steps": 164335, "total_steps": 179580, "loss": 0.7021, "lr": 1.0897825986347643e-06, "epoch": 18.302149459850764, "percentage": 91.51, "elapsed_time": "16:34:37", "remaining_time": "1:32:16", "throughput": 3348.62, "total_tokens": 199835856} +{"current_steps": 164340, "total_steps": 179580, "loss": 0.5312, "lr": 1.0890731515510178e-06, "epoch": 18.30270631473438, "percentage": 91.51, "elapsed_time": "16:34:38", "remaining_time": "1:32:14", "throughput": 3348.62, "total_tokens": 199841968} +{"current_steps": 164345, "total_steps": 179580, "loss": 0.5515, "lr": 1.0883639303251286e-06, "epoch": 18.303263169618, "percentage": 91.52, "elapsed_time": "16:34:40", "remaining_time": "1:32:12", "throughput": 3348.62, "total_tokens": 199847504} +{"current_steps": 164350, "total_steps": 179580, "loss": 0.6273, "lr": 1.0876549349638055e-06, "epoch": 18.303820024501615, "percentage": 91.52, "elapsed_time": "16:34:42", "remaining_time": "1:32:10", "throughput": 3348.63, "total_tokens": 199853872} +{"current_steps": 164355, "total_steps": 179580, "loss": 0.7135, "lr": 1.0869461654737318e-06, "epoch": 18.30437687938523, "percentage": 91.52, "elapsed_time": "16:34:44", "remaining_time": "1:32:08", "throughput": 3348.63, "total_tokens": 199859888} +{"current_steps": 164360, "total_steps": 179580, "loss": 0.6713, "lr": 1.086237621861616e-06, "epoch": 18.30493373426885, "percentage": 91.52, "elapsed_time": "16:34:45", "remaining_time": "1:32:07", "throughput": 3348.63, "total_tokens": 199865904} +{"current_steps": 164365, "total_steps": 179580, "loss": 0.6176, "lr": 1.0855293041341419e-06, "epoch": 18.305490589152466, "percentage": 91.53, "elapsed_time": "16:34:47", "remaining_time": "1:32:05", "throughput": 3348.63, "total_tokens": 199871856} +{"current_steps": 164370, "total_steps": 179580, "loss": 0.5368, "lr": 1.0848212122980068e-06, "epoch": 18.306047444036086, "percentage": 91.53, "elapsed_time": "16:34:49", "remaining_time": "1:32:03", "throughput": 3348.64, "total_tokens": 199878224} +{"current_steps": 164375, "total_steps": 179580, "loss": 0.6879, "lr": 1.084113346359894e-06, "epoch": 18.3066042989197, "percentage": 91.53, "elapsed_time": "16:34:51", "remaining_time": "1:32:01", "throughput": 3348.64, "total_tokens": 199884080} +{"current_steps": 164380, "total_steps": 179580, "loss": 0.5739, "lr": 1.083405706326493e-06, "epoch": 18.307161153803317, "percentage": 91.54, "elapsed_time": "16:34:52", "remaining_time": "1:31:59", "throughput": 3348.65, "total_tokens": 199890192} +{"current_steps": 164385, "total_steps": 179580, "loss": 0.6076, "lr": 1.0826982922044843e-06, "epoch": 18.307718008686937, "percentage": 91.54, "elapsed_time": "16:34:54", "remaining_time": "1:31:57", "throughput": 3348.65, "total_tokens": 199896496} +{"current_steps": 164390, "total_steps": 179580, "loss": 0.6845, "lr": 1.0819911040005543e-06, "epoch": 18.308274863570553, "percentage": 91.54, "elapsed_time": "16:34:56", "remaining_time": "1:31:56", "throughput": 3348.65, "total_tokens": 199902512} +{"current_steps": 164395, "total_steps": 179580, "loss": 0.6692, "lr": 1.081284141721381e-06, "epoch": 18.308831718454172, "percentage": 91.54, "elapsed_time": "16:34:58", "remaining_time": "1:31:54", "throughput": 3348.65, "total_tokens": 199908752} +{"current_steps": 164400, "total_steps": 179580, "loss": 0.7375, "lr": 1.080577405373645e-06, "epoch": 18.309388573337788, "percentage": 91.55, "elapsed_time": "16:34:59", "remaining_time": "1:31:52", "throughput": 3348.66, "total_tokens": 199914640} +{"current_steps": 164405, "total_steps": 179580, "loss": 0.8076, "lr": 1.0798708949640136e-06, "epoch": 18.309945428221404, "percentage": 91.55, "elapsed_time": "16:35:01", "remaining_time": "1:31:50", "throughput": 3348.66, "total_tokens": 199920688} +{"current_steps": 164410, "total_steps": 179580, "loss": 0.6961, "lr": 1.0791646104991698e-06, "epoch": 18.310502283105023, "percentage": 91.55, "elapsed_time": "16:35:03", "remaining_time": "1:31:48", "throughput": 3348.66, "total_tokens": 199926864} +{"current_steps": 164415, "total_steps": 179580, "loss": 0.8199, "lr": 1.0784585519857782e-06, "epoch": 18.31105913798864, "percentage": 91.56, "elapsed_time": "16:35:05", "remaining_time": "1:31:46", "throughput": 3348.67, "total_tokens": 199932912} +{"current_steps": 164420, "total_steps": 179580, "loss": 0.6934, "lr": 1.0777527194305138e-06, "epoch": 18.31161599287226, "percentage": 91.56, "elapsed_time": "16:35:06", "remaining_time": "1:31:45", "throughput": 3348.67, "total_tokens": 199938928} +{"current_steps": 164425, "total_steps": 179580, "loss": 0.5614, "lr": 1.0770471128400433e-06, "epoch": 18.312172847755875, "percentage": 91.56, "elapsed_time": "16:35:08", "remaining_time": "1:31:43", "throughput": 3348.67, "total_tokens": 199944816} +{"current_steps": 164430, "total_steps": 179580, "loss": 0.679, "lr": 1.0763417322210256e-06, "epoch": 18.31272970263949, "percentage": 91.56, "elapsed_time": "16:35:10", "remaining_time": "1:31:41", "throughput": 3348.67, "total_tokens": 199950000} +{"current_steps": 164435, "total_steps": 179580, "loss": 0.4765, "lr": 1.0756365775801275e-06, "epoch": 18.31328655752311, "percentage": 91.57, "elapsed_time": "16:35:11", "remaining_time": "1:31:39", "throughput": 3348.68, "total_tokens": 199955888} +{"current_steps": 164440, "total_steps": 179580, "loss": 0.6596, "lr": 1.0749316489240129e-06, "epoch": 18.313843412406726, "percentage": 91.57, "elapsed_time": "16:35:13", "remaining_time": "1:31:37", "throughput": 3348.68, "total_tokens": 199962288} +{"current_steps": 164445, "total_steps": 179580, "loss": 0.6536, "lr": 1.0742269462593352e-06, "epoch": 18.314400267290345, "percentage": 91.57, "elapsed_time": "16:35:15", "remaining_time": "1:31:36", "throughput": 3348.69, "total_tokens": 199968208} +{"current_steps": 164450, "total_steps": 179580, "loss": 0.7757, "lr": 1.0735224695927554e-06, "epoch": 18.31495712217396, "percentage": 91.57, "elapsed_time": "16:35:17", "remaining_time": "1:31:34", "throughput": 3348.69, "total_tokens": 199973744} +{"current_steps": 164455, "total_steps": 179580, "loss": 0.9502, "lr": 1.0728182189309211e-06, "epoch": 18.315513977057577, "percentage": 91.58, "elapsed_time": "16:35:18", "remaining_time": "1:31:32", "throughput": 3348.69, "total_tokens": 199979760} +{"current_steps": 164460, "total_steps": 179580, "loss": 0.9197, "lr": 1.0721141942804936e-06, "epoch": 18.316070831941197, "percentage": 91.58, "elapsed_time": "16:35:20", "remaining_time": "1:31:30", "throughput": 3348.69, "total_tokens": 199985808} +{"current_steps": 164465, "total_steps": 179580, "loss": 0.8093, "lr": 1.071410395648112e-06, "epoch": 18.316627686824813, "percentage": 91.58, "elapsed_time": "16:35:22", "remaining_time": "1:31:28", "throughput": 3348.7, "total_tokens": 199991952} +{"current_steps": 164470, "total_steps": 179580, "loss": 0.7973, "lr": 1.0707068230404404e-06, "epoch": 18.317184541708432, "percentage": 91.59, "elapsed_time": "16:35:24", "remaining_time": "1:31:26", "throughput": 3348.7, "total_tokens": 199997968} +{"current_steps": 164475, "total_steps": 179580, "loss": 0.82, "lr": 1.0700034764641042e-06, "epoch": 18.317741396592048, "percentage": 91.59, "elapsed_time": "16:35:25", "remaining_time": "1:31:25", "throughput": 3348.7, "total_tokens": 200003984} +{"current_steps": 164480, "total_steps": 179580, "loss": 0.789, "lr": 1.0693003559257647e-06, "epoch": 18.318298251475664, "percentage": 91.59, "elapsed_time": "16:35:27", "remaining_time": "1:31:23", "throughput": 3348.71, "total_tokens": 200010032} +{"current_steps": 164485, "total_steps": 179580, "loss": 0.5701, "lr": 1.06859746143205e-06, "epoch": 18.318855106359283, "percentage": 91.59, "elapsed_time": "16:35:29", "remaining_time": "1:31:21", "throughput": 3348.71, "total_tokens": 200015280} +{"current_steps": 164490, "total_steps": 179580, "loss": 0.6286, "lr": 1.06789479298961e-06, "epoch": 18.3194119612429, "percentage": 91.6, "elapsed_time": "16:35:30", "remaining_time": "1:31:19", "throughput": 3348.71, "total_tokens": 200021648} +{"current_steps": 164495, "total_steps": 179580, "loss": 0.7746, "lr": 1.0671923506050785e-06, "epoch": 18.31996881612652, "percentage": 91.6, "elapsed_time": "16:35:32", "remaining_time": "1:31:17", "throughput": 3348.72, "total_tokens": 200027920} +{"current_steps": 164500, "total_steps": 179580, "loss": 0.882, "lr": 1.0664901342850891e-06, "epoch": 18.320525671010135, "percentage": 91.6, "elapsed_time": "16:35:34", "remaining_time": "1:31:15", "throughput": 3348.72, "total_tokens": 200034128} +{"current_steps": 164505, "total_steps": 179580, "loss": 0.5187, "lr": 1.0657881440362755e-06, "epoch": 18.32108252589375, "percentage": 91.61, "elapsed_time": "16:35:36", "remaining_time": "1:31:14", "throughput": 3348.72, "total_tokens": 200040240} +{"current_steps": 164510, "total_steps": 179580, "loss": 0.5756, "lr": 1.0650863798652683e-06, "epoch": 18.32163938077737, "percentage": 91.61, "elapsed_time": "16:35:38", "remaining_time": "1:31:12", "throughput": 3348.73, "total_tokens": 200046576} +{"current_steps": 164515, "total_steps": 179580, "loss": 0.6382, "lr": 1.0643848417786984e-06, "epoch": 18.322196235660986, "percentage": 91.61, "elapsed_time": "16:35:39", "remaining_time": "1:31:10", "throughput": 3348.73, "total_tokens": 200052752} +{"current_steps": 164520, "total_steps": 179580, "loss": 0.7404, "lr": 1.0636835297831882e-06, "epoch": 18.322753090544605, "percentage": 91.61, "elapsed_time": "16:35:41", "remaining_time": "1:31:08", "throughput": 3348.74, "total_tokens": 200059120} +{"current_steps": 164525, "total_steps": 179580, "loss": 0.8008, "lr": 1.062982443885363e-06, "epoch": 18.32330994542822, "percentage": 91.62, "elapsed_time": "16:35:43", "remaining_time": "1:31:06", "throughput": 3348.74, "total_tokens": 200065296} +{"current_steps": 164530, "total_steps": 179580, "loss": 0.5578, "lr": 1.0622815840918481e-06, "epoch": 18.323866800311837, "percentage": 91.62, "elapsed_time": "16:35:45", "remaining_time": "1:31:05", "throughput": 3348.74, "total_tokens": 200071504} +{"current_steps": 164535, "total_steps": 179580, "loss": 0.7773, "lr": 1.0615809504092633e-06, "epoch": 18.324423655195456, "percentage": 91.62, "elapsed_time": "16:35:47", "remaining_time": "1:31:03", "throughput": 3348.75, "total_tokens": 200078064} +{"current_steps": 164540, "total_steps": 179580, "loss": 0.651, "lr": 1.060880542844228e-06, "epoch": 18.324980510079072, "percentage": 91.62, "elapsed_time": "16:35:48", "remaining_time": "1:31:01", "throughput": 3348.75, "total_tokens": 200083696} +{"current_steps": 164545, "total_steps": 179580, "loss": 0.8305, "lr": 1.060180361403354e-06, "epoch": 18.325537364962692, "percentage": 91.63, "elapsed_time": "16:35:50", "remaining_time": "1:30:59", "throughput": 3348.75, "total_tokens": 200089936} +{"current_steps": 164550, "total_steps": 179580, "loss": 0.8829, "lr": 1.0594804060932522e-06, "epoch": 18.326094219846308, "percentage": 91.63, "elapsed_time": "16:35:52", "remaining_time": "1:30:57", "throughput": 3348.76, "total_tokens": 200095696} +{"current_steps": 164555, "total_steps": 179580, "loss": 0.9065, "lr": 1.0587806769205426e-06, "epoch": 18.326651074729924, "percentage": 91.63, "elapsed_time": "16:35:54", "remaining_time": "1:30:55", "throughput": 3348.76, "total_tokens": 200101840} +{"current_steps": 164560, "total_steps": 179580, "loss": 0.6922, "lr": 1.0580811738918284e-06, "epoch": 18.327207929613543, "percentage": 91.64, "elapsed_time": "16:35:55", "remaining_time": "1:30:54", "throughput": 3348.76, "total_tokens": 200107664} +{"current_steps": 164565, "total_steps": 179580, "loss": 0.8078, "lr": 1.0573818970137233e-06, "epoch": 18.32776478449716, "percentage": 91.64, "elapsed_time": "16:35:57", "remaining_time": "1:30:52", "throughput": 3348.76, "total_tokens": 200113584} +{"current_steps": 164570, "total_steps": 179580, "loss": 0.8202, "lr": 1.056682846292828e-06, "epoch": 18.32832163938078, "percentage": 91.64, "elapsed_time": "16:35:59", "remaining_time": "1:30:50", "throughput": 3348.77, "total_tokens": 200119824} +{"current_steps": 164575, "total_steps": 179580, "loss": 0.7816, "lr": 1.0559840217357452e-06, "epoch": 18.328878494264394, "percentage": 91.64, "elapsed_time": "16:36:00", "remaining_time": "1:30:48", "throughput": 3348.77, "total_tokens": 200125744} +{"current_steps": 164580, "total_steps": 179580, "loss": 0.7681, "lr": 1.0552854233490754e-06, "epoch": 18.329435349148014, "percentage": 91.65, "elapsed_time": "16:36:02", "remaining_time": "1:30:46", "throughput": 3348.77, "total_tokens": 200132016} +{"current_steps": 164585, "total_steps": 179580, "loss": 0.9568, "lr": 1.0545870511394218e-06, "epoch": 18.32999220403163, "percentage": 91.65, "elapsed_time": "16:36:04", "remaining_time": "1:30:45", "throughput": 3348.78, "total_tokens": 200138064} +{"current_steps": 164590, "total_steps": 179580, "loss": 0.6892, "lr": 1.053888905113376e-06, "epoch": 18.330549058915246, "percentage": 91.65, "elapsed_time": "16:36:06", "remaining_time": "1:30:43", "throughput": 3348.78, "total_tokens": 200144208} +{"current_steps": 164595, "total_steps": 179580, "loss": 0.6545, "lr": 1.0531909852775385e-06, "epoch": 18.331105913798865, "percentage": 91.66, "elapsed_time": "16:36:08", "remaining_time": "1:30:41", "throughput": 3348.79, "total_tokens": 200150480} +{"current_steps": 164600, "total_steps": 179580, "loss": 0.6415, "lr": 1.0524932916384928e-06, "epoch": 18.33166276868248, "percentage": 91.66, "elapsed_time": "16:36:09", "remaining_time": "1:30:39", "throughput": 3348.79, "total_tokens": 200156464} +{"current_steps": 164605, "total_steps": 179580, "loss": 0.6575, "lr": 1.0517958242028364e-06, "epoch": 18.3322196235661, "percentage": 91.66, "elapsed_time": "16:36:11", "remaining_time": "1:30:37", "throughput": 3348.8, "total_tokens": 200162640} +{"current_steps": 164610, "total_steps": 179580, "loss": 0.6298, "lr": 1.051098582977153e-06, "epoch": 18.332776478449716, "percentage": 91.66, "elapsed_time": "16:36:13", "remaining_time": "1:30:35", "throughput": 3348.8, "total_tokens": 200169168} +{"current_steps": 164615, "total_steps": 179580, "loss": 0.7628, "lr": 1.0504015679680373e-06, "epoch": 18.333333333333332, "percentage": 91.67, "elapsed_time": "16:36:15", "remaining_time": "1:30:34", "throughput": 3348.8, "total_tokens": 200175312} +{"current_steps": 164620, "total_steps": 179580, "loss": 0.8342, "lr": 1.0497047791820619e-06, "epoch": 18.33389018821695, "percentage": 91.67, "elapsed_time": "16:36:16", "remaining_time": "1:30:32", "throughput": 3348.81, "total_tokens": 200181680} +{"current_steps": 164625, "total_steps": 179580, "loss": 0.565, "lr": 1.0490082166258159e-06, "epoch": 18.334447043100567, "percentage": 91.67, "elapsed_time": "16:36:18", "remaining_time": "1:30:30", "throughput": 3348.81, "total_tokens": 200188016} +{"current_steps": 164630, "total_steps": 179580, "loss": 0.6668, "lr": 1.0483118803058745e-06, "epoch": 18.335003897984187, "percentage": 91.68, "elapsed_time": "16:36:20", "remaining_time": "1:30:28", "throughput": 3348.82, "total_tokens": 200193968} +{"current_steps": 164635, "total_steps": 179580, "loss": 0.9341, "lr": 1.0476157702288187e-06, "epoch": 18.335560752867803, "percentage": 91.68, "elapsed_time": "16:36:22", "remaining_time": "1:30:26", "throughput": 3348.82, "total_tokens": 200200112} +{"current_steps": 164640, "total_steps": 179580, "loss": 0.6237, "lr": 1.0469198864012236e-06, "epoch": 18.33611760775142, "percentage": 91.68, "elapsed_time": "16:36:24", "remaining_time": "1:30:25", "throughput": 3348.82, "total_tokens": 200206000} +{"current_steps": 164645, "total_steps": 179580, "loss": 0.613, "lr": 1.0462242288296593e-06, "epoch": 18.336674462635038, "percentage": 91.68, "elapsed_time": "16:36:25", "remaining_time": "1:30:23", "throughput": 3348.83, "total_tokens": 200212368} +{"current_steps": 164650, "total_steps": 179580, "loss": 0.6903, "lr": 1.045528797520695e-06, "epoch": 18.337231317518654, "percentage": 91.69, "elapsed_time": "16:36:27", "remaining_time": "1:30:21", "throughput": 3348.83, "total_tokens": 200218544} +{"current_steps": 164655, "total_steps": 179580, "loss": 0.9, "lr": 1.0448335924809093e-06, "epoch": 18.337788172402274, "percentage": 91.69, "elapsed_time": "16:36:29", "remaining_time": "1:30:19", "throughput": 3348.83, "total_tokens": 200223824} +{"current_steps": 164660, "total_steps": 179580, "loss": 0.587, "lr": 1.0441386137168608e-06, "epoch": 18.33834502728589, "percentage": 91.69, "elapsed_time": "16:36:30", "remaining_time": "1:30:17", "throughput": 3348.83, "total_tokens": 200229552} +{"current_steps": 164665, "total_steps": 179580, "loss": 0.9211, "lr": 1.043443861235116e-06, "epoch": 18.338901882169505, "percentage": 91.69, "elapsed_time": "16:36:32", "remaining_time": "1:30:15", "throughput": 3348.84, "total_tokens": 200235792} +{"current_steps": 164670, "total_steps": 179580, "loss": 0.5743, "lr": 1.0427493350422368e-06, "epoch": 18.339458737053125, "percentage": 91.7, "elapsed_time": "16:36:34", "remaining_time": "1:30:14", "throughput": 3348.84, "total_tokens": 200241776} +{"current_steps": 164675, "total_steps": 179580, "loss": 0.6221, "lr": 1.0420550351447844e-06, "epoch": 18.34001559193674, "percentage": 91.7, "elapsed_time": "16:36:36", "remaining_time": "1:30:12", "throughput": 3348.84, "total_tokens": 200248080} +{"current_steps": 164680, "total_steps": 179580, "loss": 0.5824, "lr": 1.0413609615493147e-06, "epoch": 18.34057244682036, "percentage": 91.7, "elapsed_time": "16:36:37", "remaining_time": "1:30:10", "throughput": 3348.85, "total_tokens": 200254320} +{"current_steps": 164685, "total_steps": 179580, "loss": 0.9071, "lr": 1.0406671142623947e-06, "epoch": 18.341129301703976, "percentage": 91.71, "elapsed_time": "16:36:39", "remaining_time": "1:30:08", "throughput": 3348.85, "total_tokens": 200260496} +{"current_steps": 164690, "total_steps": 179580, "loss": 0.6802, "lr": 1.0399734932905608e-06, "epoch": 18.341686156587592, "percentage": 91.71, "elapsed_time": "16:36:41", "remaining_time": "1:30:06", "throughput": 3348.85, "total_tokens": 200266448} +{"current_steps": 164695, "total_steps": 179580, "loss": 0.8788, "lr": 1.0392800986403772e-06, "epoch": 18.34224301147121, "percentage": 91.71, "elapsed_time": "16:36:43", "remaining_time": "1:30:04", "throughput": 3348.86, "total_tokens": 200271824} +{"current_steps": 164700, "total_steps": 179580, "loss": 0.7325, "lr": 1.0385869303183888e-06, "epoch": 18.342799866354827, "percentage": 91.71, "elapsed_time": "16:36:44", "remaining_time": "1:30:03", "throughput": 3348.86, "total_tokens": 200278160} +{"current_steps": 164705, "total_steps": 179580, "loss": 0.868, "lr": 1.0378939883311457e-06, "epoch": 18.343356721238447, "percentage": 91.72, "elapsed_time": "16:36:46", "remaining_time": "1:30:01", "throughput": 3348.86, "total_tokens": 200284272} +{"current_steps": 164710, "total_steps": 179580, "loss": 0.5245, "lr": 1.0372012726851926e-06, "epoch": 18.343913576122063, "percentage": 91.72, "elapsed_time": "16:36:48", "remaining_time": "1:29:59", "throughput": 3348.86, "total_tokens": 200290192} +{"current_steps": 164715, "total_steps": 179580, "loss": 0.8731, "lr": 1.0365087833870718e-06, "epoch": 18.34447043100568, "percentage": 91.72, "elapsed_time": "16:36:50", "remaining_time": "1:29:57", "throughput": 3348.87, "total_tokens": 200295856} +{"current_steps": 164720, "total_steps": 179580, "loss": 0.7639, "lr": 1.0358165204433223e-06, "epoch": 18.345027285889298, "percentage": 91.73, "elapsed_time": "16:36:51", "remaining_time": "1:29:55", "throughput": 3348.87, "total_tokens": 200302320} +{"current_steps": 164725, "total_steps": 179580, "loss": 0.7055, "lr": 1.035124483860489e-06, "epoch": 18.345584140772914, "percentage": 91.73, "elapsed_time": "16:36:53", "remaining_time": "1:29:54", "throughput": 3348.87, "total_tokens": 200308336} +{"current_steps": 164730, "total_steps": 179580, "loss": 0.9046, "lr": 1.0344326736451027e-06, "epoch": 18.346140995656533, "percentage": 91.73, "elapsed_time": "16:36:55", "remaining_time": "1:29:52", "throughput": 3348.88, "total_tokens": 200314224} +{"current_steps": 164735, "total_steps": 179580, "loss": 1.0114, "lr": 1.0337410898037026e-06, "epoch": 18.34669785054015, "percentage": 91.73, "elapsed_time": "16:36:57", "remaining_time": "1:29:50", "throughput": 3348.88, "total_tokens": 200320336} +{"current_steps": 164740, "total_steps": 179580, "loss": 0.7482, "lr": 1.0330497323428168e-06, "epoch": 18.347254705423765, "percentage": 91.74, "elapsed_time": "16:36:58", "remaining_time": "1:29:48", "throughput": 3348.88, "total_tokens": 200326064} +{"current_steps": 164745, "total_steps": 179580, "loss": 0.6952, "lr": 1.0323586012689818e-06, "epoch": 18.347811560307385, "percentage": 91.74, "elapsed_time": "16:37:00", "remaining_time": "1:29:46", "throughput": 3348.89, "total_tokens": 200331856} +{"current_steps": 164750, "total_steps": 179580, "loss": 0.4717, "lr": 1.0316676965887173e-06, "epoch": 18.348368415191, "percentage": 91.74, "elapsed_time": "16:37:02", "remaining_time": "1:29:44", "throughput": 3348.89, "total_tokens": 200337712} +{"current_steps": 164755, "total_steps": 179580, "loss": 1.0038, "lr": 1.0309770183085572e-06, "epoch": 18.34892527007462, "percentage": 91.74, "elapsed_time": "16:37:03", "remaining_time": "1:29:43", "throughput": 3348.89, "total_tokens": 200343952} +{"current_steps": 164760, "total_steps": 179580, "loss": 0.7153, "lr": 1.0302865664350265e-06, "epoch": 18.349482124958236, "percentage": 91.75, "elapsed_time": "16:37:05", "remaining_time": "1:29:41", "throughput": 3348.9, "total_tokens": 200350288} +{"current_steps": 164765, "total_steps": 179580, "loss": 0.7555, "lr": 1.0295963409746394e-06, "epoch": 18.35003897984185, "percentage": 91.75, "elapsed_time": "16:37:07", "remaining_time": "1:29:39", "throughput": 3348.9, "total_tokens": 200356656} +{"current_steps": 164770, "total_steps": 179580, "loss": 0.6427, "lr": 1.028906341933919e-06, "epoch": 18.35059583472547, "percentage": 91.75, "elapsed_time": "16:37:09", "remaining_time": "1:29:37", "throughput": 3348.91, "total_tokens": 200363280} +{"current_steps": 164775, "total_steps": 179580, "loss": 0.6192, "lr": 1.0282165693193846e-06, "epoch": 18.351152689609087, "percentage": 91.76, "elapsed_time": "16:37:11", "remaining_time": "1:29:35", "throughput": 3348.9, "total_tokens": 200369392} +{"current_steps": 164780, "total_steps": 179580, "loss": 0.523, "lr": 1.0275270231375533e-06, "epoch": 18.351709544492707, "percentage": 91.76, "elapsed_time": "16:37:13", "remaining_time": "1:29:34", "throughput": 3348.9, "total_tokens": 200375376} +{"current_steps": 164785, "total_steps": 179580, "loss": 0.5704, "lr": 1.026837703394934e-06, "epoch": 18.352266399376322, "percentage": 91.76, "elapsed_time": "16:37:14", "remaining_time": "1:29:32", "throughput": 3348.91, "total_tokens": 200381648} +{"current_steps": 164790, "total_steps": 179580, "loss": 0.5429, "lr": 1.026148610098035e-06, "epoch": 18.35282325425994, "percentage": 91.76, "elapsed_time": "16:37:16", "remaining_time": "1:29:30", "throughput": 3348.91, "total_tokens": 200387504} +{"current_steps": 164795, "total_steps": 179580, "loss": 1.0245, "lr": 1.0254597432533763e-06, "epoch": 18.353380109143558, "percentage": 91.77, "elapsed_time": "16:37:18", "remaining_time": "1:29:28", "throughput": 3348.91, "total_tokens": 200393264} +{"current_steps": 164800, "total_steps": 179580, "loss": 0.6405, "lr": 1.024771102867453e-06, "epoch": 18.353936964027174, "percentage": 91.77, "elapsed_time": "16:37:20", "remaining_time": "1:29:26", "throughput": 3348.92, "total_tokens": 200399760} +{"current_steps": 164805, "total_steps": 179580, "loss": 0.5259, "lr": 1.0240826889467814e-06, "epoch": 18.354493818910793, "percentage": 91.77, "elapsed_time": "16:37:21", "remaining_time": "1:29:24", "throughput": 3348.92, "total_tokens": 200405936} +{"current_steps": 164810, "total_steps": 179580, "loss": 0.7329, "lr": 1.023394501497854e-06, "epoch": 18.35505067379441, "percentage": 91.78, "elapsed_time": "16:37:23", "remaining_time": "1:29:23", "throughput": 3348.92, "total_tokens": 200411728} +{"current_steps": 164815, "total_steps": 179580, "loss": 0.7562, "lr": 1.0227065405271768e-06, "epoch": 18.355607528678025, "percentage": 91.78, "elapsed_time": "16:37:25", "remaining_time": "1:29:21", "throughput": 3348.92, "total_tokens": 200417520} +{"current_steps": 164820, "total_steps": 179580, "loss": 0.7244, "lr": 1.0220188060412445e-06, "epoch": 18.356164383561644, "percentage": 91.78, "elapsed_time": "16:37:27", "remaining_time": "1:29:19", "throughput": 3348.93, "total_tokens": 200423344} +{"current_steps": 164825, "total_steps": 179580, "loss": 0.6631, "lr": 1.0213312980465573e-06, "epoch": 18.35672123844526, "percentage": 91.78, "elapsed_time": "16:37:28", "remaining_time": "1:29:17", "throughput": 3348.93, "total_tokens": 200429104} +{"current_steps": 164830, "total_steps": 179580, "loss": 0.8112, "lr": 1.0206440165496073e-06, "epoch": 18.35727809332888, "percentage": 91.79, "elapsed_time": "16:37:30", "remaining_time": "1:29:15", "throughput": 3348.93, "total_tokens": 200434576} +{"current_steps": 164835, "total_steps": 179580, "loss": 0.6771, "lr": 1.0199569615568865e-06, "epoch": 18.357834948212496, "percentage": 91.79, "elapsed_time": "16:37:32", "remaining_time": "1:29:13", "throughput": 3348.94, "total_tokens": 200440816} +{"current_steps": 164840, "total_steps": 179580, "loss": 0.7676, "lr": 1.0192701330748816e-06, "epoch": 18.35839180309611, "percentage": 91.79, "elapsed_time": "16:37:33", "remaining_time": "1:29:12", "throughput": 3348.94, "total_tokens": 200446736} +{"current_steps": 164845, "total_steps": 179580, "loss": 0.6126, "lr": 1.0185835311100871e-06, "epoch": 18.35894865797973, "percentage": 91.79, "elapsed_time": "16:37:35", "remaining_time": "1:29:10", "throughput": 3348.94, "total_tokens": 200452880} +{"current_steps": 164850, "total_steps": 179580, "loss": 0.9034, "lr": 1.0178971556689843e-06, "epoch": 18.359505512863347, "percentage": 91.8, "elapsed_time": "16:37:37", "remaining_time": "1:29:08", "throughput": 3348.94, "total_tokens": 200458704} +{"current_steps": 164855, "total_steps": 179580, "loss": 0.6532, "lr": 1.0172110067580565e-06, "epoch": 18.360062367746966, "percentage": 91.8, "elapsed_time": "16:37:38", "remaining_time": "1:29:06", "throughput": 3348.95, "total_tokens": 200464496} +{"current_steps": 164860, "total_steps": 179580, "loss": 0.495, "lr": 1.0165250843837848e-06, "epoch": 18.360619222630582, "percentage": 91.8, "elapsed_time": "16:37:40", "remaining_time": "1:29:04", "throughput": 3348.95, "total_tokens": 200470672} +{"current_steps": 164865, "total_steps": 179580, "loss": 0.6387, "lr": 1.01583938855265e-06, "epoch": 18.361176077514198, "percentage": 91.81, "elapsed_time": "16:37:42", "remaining_time": "1:29:03", "throughput": 3348.95, "total_tokens": 200476624} +{"current_steps": 164870, "total_steps": 179580, "loss": 0.6514, "lr": 1.0151539192711251e-06, "epoch": 18.361732932397818, "percentage": 91.81, "elapsed_time": "16:37:44", "remaining_time": "1:29:01", "throughput": 3348.96, "total_tokens": 200482960} +{"current_steps": 164875, "total_steps": 179580, "loss": 0.6611, "lr": 1.0144686765456934e-06, "epoch": 18.362289787281433, "percentage": 91.81, "elapsed_time": "16:37:46", "remaining_time": "1:28:59", "throughput": 3348.96, "total_tokens": 200489264} +{"current_steps": 164880, "total_steps": 179580, "loss": 0.7955, "lr": 1.0137836603828165e-06, "epoch": 18.362846642165053, "percentage": 91.81, "elapsed_time": "16:37:47", "remaining_time": "1:28:57", "throughput": 3348.97, "total_tokens": 200495568} +{"current_steps": 164885, "total_steps": 179580, "loss": 0.6711, "lr": 1.0130988707889727e-06, "epoch": 18.36340349704867, "percentage": 91.82, "elapsed_time": "16:37:49", "remaining_time": "1:28:55", "throughput": 3348.97, "total_tokens": 200501552} +{"current_steps": 164890, "total_steps": 179580, "loss": 0.7388, "lr": 1.012414307770626e-06, "epoch": 18.363960351932285, "percentage": 91.82, "elapsed_time": "16:37:51", "remaining_time": "1:28:53", "throughput": 3348.97, "total_tokens": 200507632} +{"current_steps": 164895, "total_steps": 179580, "loss": 0.5729, "lr": 1.0117299713342466e-06, "epoch": 18.364517206815904, "percentage": 91.82, "elapsed_time": "16:37:53", "remaining_time": "1:28:52", "throughput": 3348.98, "total_tokens": 200513968} +{"current_steps": 164900, "total_steps": 179580, "loss": 0.8528, "lr": 1.0110458614862983e-06, "epoch": 18.36507406169952, "percentage": 91.83, "elapsed_time": "16:37:54", "remaining_time": "1:28:50", "throughput": 3348.98, "total_tokens": 200519984} +{"current_steps": 164905, "total_steps": 179580, "loss": 0.6765, "lr": 1.0103619782332403e-06, "epoch": 18.36563091658314, "percentage": 91.83, "elapsed_time": "16:37:56", "remaining_time": "1:28:48", "throughput": 3348.98, "total_tokens": 200525936} +{"current_steps": 164910, "total_steps": 179580, "loss": 0.6548, "lr": 1.0096783215815308e-06, "epoch": 18.366187771466755, "percentage": 91.83, "elapsed_time": "16:37:58", "remaining_time": "1:28:46", "throughput": 3348.99, "total_tokens": 200532240} +{"current_steps": 164915, "total_steps": 179580, "loss": 0.6943, "lr": 1.008994891537632e-06, "epoch": 18.366744626350375, "percentage": 91.83, "elapsed_time": "16:38:00", "remaining_time": "1:28:44", "throughput": 3348.99, "total_tokens": 200538608} +{"current_steps": 164920, "total_steps": 179580, "loss": 0.7854, "lr": 1.008311688107999e-06, "epoch": 18.36730148123399, "percentage": 91.84, "elapsed_time": "16:38:02", "remaining_time": "1:28:43", "throughput": 3348.99, "total_tokens": 200544528} +{"current_steps": 164925, "total_steps": 179580, "loss": 0.5849, "lr": 1.0076287112990856e-06, "epoch": 18.367858336117607, "percentage": 91.84, "elapsed_time": "16:38:03", "remaining_time": "1:28:41", "throughput": 3349.0, "total_tokens": 200550736} +{"current_steps": 164930, "total_steps": 179580, "loss": 0.6153, "lr": 1.0069459611173365e-06, "epoch": 18.368415191001226, "percentage": 91.84, "elapsed_time": "16:38:05", "remaining_time": "1:28:39", "throughput": 3349.0, "total_tokens": 200556592} +{"current_steps": 164935, "total_steps": 179580, "loss": 0.463, "lr": 1.0062634375692077e-06, "epoch": 18.368972045884842, "percentage": 91.84, "elapsed_time": "16:38:07", "remaining_time": "1:28:37", "throughput": 3349.0, "total_tokens": 200562544} +{"current_steps": 164940, "total_steps": 179580, "loss": 0.7787, "lr": 1.0055811406611437e-06, "epoch": 18.36952890076846, "percentage": 91.85, "elapsed_time": "16:38:09", "remaining_time": "1:28:35", "throughput": 3349.01, "total_tokens": 200568752} +{"current_steps": 164945, "total_steps": 179580, "loss": 0.8262, "lr": 1.0048990703995926e-06, "epoch": 18.370085755652077, "percentage": 91.85, "elapsed_time": "16:38:10", "remaining_time": "1:28:33", "throughput": 3349.01, "total_tokens": 200574800} +{"current_steps": 164950, "total_steps": 179580, "loss": 0.5151, "lr": 1.0042172267909933e-06, "epoch": 18.370642610535693, "percentage": 91.85, "elapsed_time": "16:38:12", "remaining_time": "1:28:32", "throughput": 3349.01, "total_tokens": 200580624} +{"current_steps": 164955, "total_steps": 179580, "loss": 0.9375, "lr": 1.0035356098417853e-06, "epoch": 18.371199465419313, "percentage": 91.86, "elapsed_time": "16:38:14", "remaining_time": "1:28:30", "throughput": 3349.01, "total_tokens": 200586544} +{"current_steps": 164960, "total_steps": 179580, "loss": 0.9085, "lr": 1.0028542195584107e-06, "epoch": 18.37175632030293, "percentage": 91.86, "elapsed_time": "16:38:15", "remaining_time": "1:28:28", "throughput": 3349.02, "total_tokens": 200592336} +{"current_steps": 164965, "total_steps": 179580, "loss": 0.8801, "lr": 1.0021730559473031e-06, "epoch": 18.372313175186548, "percentage": 91.86, "elapsed_time": "16:38:17", "remaining_time": "1:28:26", "throughput": 3349.02, "total_tokens": 200598768} +{"current_steps": 164970, "total_steps": 179580, "loss": 0.5604, "lr": 1.001492119014899e-06, "epoch": 18.372870030070164, "percentage": 91.86, "elapsed_time": "16:38:19", "remaining_time": "1:28:24", "throughput": 3349.03, "total_tokens": 200605104} +{"current_steps": 164975, "total_steps": 179580, "loss": 0.6026, "lr": 1.0008114087676296e-06, "epoch": 18.37342688495378, "percentage": 91.87, "elapsed_time": "16:38:21", "remaining_time": "1:28:22", "throughput": 3349.03, "total_tokens": 200611536} +{"current_steps": 164980, "total_steps": 179580, "loss": 0.8124, "lr": 1.0001309252119228e-06, "epoch": 18.3739837398374, "percentage": 91.87, "elapsed_time": "16:38:23", "remaining_time": "1:28:21", "throughput": 3349.04, "total_tokens": 200617840} +{"current_steps": 164985, "total_steps": 179580, "loss": 0.6572, "lr": 9.99450668354207e-07, "epoch": 18.374540594721015, "percentage": 91.87, "elapsed_time": "16:38:24", "remaining_time": "1:28:19", "throughput": 3349.04, "total_tokens": 200623408} +{"current_steps": 164990, "total_steps": 179580, "loss": 0.691, "lr": 9.987706382009104e-07, "epoch": 18.375097449604635, "percentage": 91.88, "elapsed_time": "16:38:26", "remaining_time": "1:28:17", "throughput": 3349.04, "total_tokens": 200629648} +{"current_steps": 164995, "total_steps": 179580, "loss": 0.5637, "lr": 9.980908347584556e-07, "epoch": 18.37565430448825, "percentage": 91.88, "elapsed_time": "16:38:28", "remaining_time": "1:28:15", "throughput": 3349.04, "total_tokens": 200635792} +{"current_steps": 165000, "total_steps": 179580, "loss": 0.7285, "lr": 9.974112580332623e-07, "epoch": 18.376211159371866, "percentage": 91.88, "elapsed_time": "16:38:30", "remaining_time": "1:28:13", "throughput": 3349.05, "total_tokens": 200642288} +{"current_steps": 165005, "total_steps": 179580, "loss": 0.7721, "lr": 9.96731908031745e-07, "epoch": 18.376768014255486, "percentage": 91.88, "elapsed_time": "16:38:32", "remaining_time": "1:28:12", "throughput": 3349.05, "total_tokens": 200648592} +{"current_steps": 165010, "total_steps": 179580, "loss": 1.0339, "lr": 9.960527847603318e-07, "epoch": 18.377324869139102, "percentage": 91.89, "elapsed_time": "16:38:33", "remaining_time": "1:28:10", "throughput": 3349.06, "total_tokens": 200654608} +{"current_steps": 165015, "total_steps": 179580, "loss": 0.7374, "lr": 9.953738882254287e-07, "epoch": 18.37788172402272, "percentage": 91.89, "elapsed_time": "16:38:35", "remaining_time": "1:28:08", "throughput": 3349.06, "total_tokens": 200660528} +{"current_steps": 165020, "total_steps": 179580, "loss": 0.6644, "lr": 9.946952184334558e-07, "epoch": 18.378438578906337, "percentage": 91.89, "elapsed_time": "16:38:37", "remaining_time": "1:28:06", "throughput": 3349.07, "total_tokens": 200666704} +{"current_steps": 165025, "total_steps": 179580, "loss": 0.6584, "lr": 9.940167753908158e-07, "epoch": 18.378995433789953, "percentage": 91.89, "elapsed_time": "16:38:39", "remaining_time": "1:28:04", "throughput": 3349.07, "total_tokens": 200672816} +{"current_steps": 165030, "total_steps": 179580, "loss": 0.9589, "lr": 9.933385591039207e-07, "epoch": 18.379552288673572, "percentage": 91.9, "elapsed_time": "16:38:40", "remaining_time": "1:28:02", "throughput": 3349.07, "total_tokens": 200678352} +{"current_steps": 165035, "total_steps": 179580, "loss": 0.7045, "lr": 9.926605695791734e-07, "epoch": 18.38010914355719, "percentage": 91.9, "elapsed_time": "16:38:42", "remaining_time": "1:28:01", "throughput": 3349.07, "total_tokens": 200684592} +{"current_steps": 165040, "total_steps": 179580, "loss": 0.6767, "lr": 9.919828068229885e-07, "epoch": 18.380665998440808, "percentage": 91.9, "elapsed_time": "16:38:44", "remaining_time": "1:27:59", "throughput": 3349.08, "total_tokens": 200690832} +{"current_steps": 165045, "total_steps": 179580, "loss": 0.674, "lr": 9.91305270841758e-07, "epoch": 18.381222853324424, "percentage": 91.91, "elapsed_time": "16:38:45", "remaining_time": "1:27:57", "throughput": 3349.08, "total_tokens": 200696816} +{"current_steps": 165050, "total_steps": 179580, "loss": 0.7722, "lr": 9.906279616418852e-07, "epoch": 18.38177970820804, "percentage": 91.91, "elapsed_time": "16:38:47", "remaining_time": "1:27:55", "throughput": 3349.08, "total_tokens": 200702832} +{"current_steps": 165055, "total_steps": 179580, "loss": 0.569, "lr": 9.899508792297618e-07, "epoch": 18.38233656309166, "percentage": 91.91, "elapsed_time": "16:38:49", "remaining_time": "1:27:53", "throughput": 3349.09, "total_tokens": 200708560} +{"current_steps": 165060, "total_steps": 179580, "loss": 0.9321, "lr": 9.892740236117942e-07, "epoch": 18.382893417975275, "percentage": 91.91, "elapsed_time": "16:38:51", "remaining_time": "1:27:52", "throughput": 3349.09, "total_tokens": 200714480} +{"current_steps": 165065, "total_steps": 179580, "loss": 0.8225, "lr": 9.885973947943717e-07, "epoch": 18.383450272858894, "percentage": 91.92, "elapsed_time": "16:38:52", "remaining_time": "1:27:50", "throughput": 3349.09, "total_tokens": 200720400} +{"current_steps": 165070, "total_steps": 179580, "loss": 0.5542, "lr": 9.879209927838835e-07, "epoch": 18.38400712774251, "percentage": 91.92, "elapsed_time": "16:38:54", "remaining_time": "1:27:48", "throughput": 3349.1, "total_tokens": 200726352} +{"current_steps": 165075, "total_steps": 179580, "loss": 0.6466, "lr": 9.872448175867161e-07, "epoch": 18.384563982626126, "percentage": 91.92, "elapsed_time": "16:38:56", "remaining_time": "1:27:46", "throughput": 3349.1, "total_tokens": 200732144} +{"current_steps": 165080, "total_steps": 179580, "loss": 0.5716, "lr": 9.865688692092617e-07, "epoch": 18.385120837509746, "percentage": 91.93, "elapsed_time": "16:38:57", "remaining_time": "1:27:44", "throughput": 3349.1, "total_tokens": 200737904} +{"current_steps": 165085, "total_steps": 179580, "loss": 0.7178, "lr": 9.858931476579042e-07, "epoch": 18.38567769239336, "percentage": 91.93, "elapsed_time": "16:38:59", "remaining_time": "1:27:42", "throughput": 3349.1, "total_tokens": 200743504} +{"current_steps": 165090, "total_steps": 179580, "loss": 0.6978, "lr": 9.8521765293903e-07, "epoch": 18.38623454727698, "percentage": 91.93, "elapsed_time": "16:39:01", "remaining_time": "1:27:41", "throughput": 3349.11, "total_tokens": 200749808} +{"current_steps": 165095, "total_steps": 179580, "loss": 0.6748, "lr": 9.845423850590092e-07, "epoch": 18.386791402160597, "percentage": 91.93, "elapsed_time": "16:39:03", "remaining_time": "1:27:39", "throughput": 3349.11, "total_tokens": 200755760} +{"current_steps": 165100, "total_steps": 179580, "loss": 0.7435, "lr": 9.83867344024228e-07, "epoch": 18.387348257044213, "percentage": 91.94, "elapsed_time": "16:39:04", "remaining_time": "1:27:37", "throughput": 3349.11, "total_tokens": 200762064} +{"current_steps": 165105, "total_steps": 179580, "loss": 0.6857, "lr": 9.831925298410593e-07, "epoch": 18.387905111927832, "percentage": 91.94, "elapsed_time": "16:39:06", "remaining_time": "1:27:35", "throughput": 3349.11, "total_tokens": 200767824} +{"current_steps": 165110, "total_steps": 179580, "loss": 0.6144, "lr": 9.825179425158814e-07, "epoch": 18.388461966811448, "percentage": 91.94, "elapsed_time": "16:39:08", "remaining_time": "1:27:33", "throughput": 3349.12, "total_tokens": 200773520} +{"current_steps": 165115, "total_steps": 179580, "loss": 0.6711, "lr": 9.81843582055067e-07, "epoch": 18.389018821695068, "percentage": 91.95, "elapsed_time": "16:39:10", "remaining_time": "1:27:31", "throughput": 3349.12, "total_tokens": 200779952} +{"current_steps": 165120, "total_steps": 179580, "loss": 0.735, "lr": 9.811694484649802e-07, "epoch": 18.389575676578684, "percentage": 91.95, "elapsed_time": "16:39:11", "remaining_time": "1:27:30", "throughput": 3349.13, "total_tokens": 200786288} +{"current_steps": 165125, "total_steps": 179580, "loss": 0.6414, "lr": 9.804955417519884e-07, "epoch": 18.3901325314623, "percentage": 91.95, "elapsed_time": "16:39:13", "remaining_time": "1:27:28", "throughput": 3349.13, "total_tokens": 200792240} +{"current_steps": 165130, "total_steps": 179580, "loss": 0.6549, "lr": 9.798218619224641e-07, "epoch": 18.39068938634592, "percentage": 91.95, "elapsed_time": "16:39:15", "remaining_time": "1:27:26", "throughput": 3349.13, "total_tokens": 200798160} +{"current_steps": 165135, "total_steps": 179580, "loss": 0.71, "lr": 9.79148408982769e-07, "epoch": 18.391246241229535, "percentage": 91.96, "elapsed_time": "16:39:17", "remaining_time": "1:27:24", "throughput": 3349.14, "total_tokens": 200804272} +{"current_steps": 165140, "total_steps": 179580, "loss": 0.8085, "lr": 9.784751829392592e-07, "epoch": 18.391803096113154, "percentage": 91.96, "elapsed_time": "16:39:18", "remaining_time": "1:27:22", "throughput": 3349.14, "total_tokens": 200809968} +{"current_steps": 165145, "total_steps": 179580, "loss": 0.6353, "lr": 9.77802183798296e-07, "epoch": 18.39235995099677, "percentage": 91.96, "elapsed_time": "16:39:20", "remaining_time": "1:27:21", "throughput": 3349.14, "total_tokens": 200816400} +{"current_steps": 165150, "total_steps": 179580, "loss": 0.6344, "lr": 9.771294115662383e-07, "epoch": 18.392916805880386, "percentage": 91.96, "elapsed_time": "16:39:22", "remaining_time": "1:27:19", "throughput": 3349.14, "total_tokens": 200822448} +{"current_steps": 165155, "total_steps": 179580, "loss": 0.7497, "lr": 9.764568662494395e-07, "epoch": 18.393473660764005, "percentage": 91.97, "elapsed_time": "16:39:23", "remaining_time": "1:27:17", "throughput": 3349.15, "total_tokens": 200828144} +{"current_steps": 165160, "total_steps": 179580, "loss": 0.6352, "lr": 9.757845478542554e-07, "epoch": 18.39403051564762, "percentage": 91.97, "elapsed_time": "16:39:25", "remaining_time": "1:27:15", "throughput": 3349.15, "total_tokens": 200834064} +{"current_steps": 165165, "total_steps": 179580, "loss": 0.9246, "lr": 9.751124563870312e-07, "epoch": 18.39458737053124, "percentage": 91.97, "elapsed_time": "16:39:27", "remaining_time": "1:27:13", "throughput": 3349.15, "total_tokens": 200840048} +{"current_steps": 165170, "total_steps": 179580, "loss": 0.6753, "lr": 9.744405918541227e-07, "epoch": 18.395144225414857, "percentage": 91.98, "elapsed_time": "16:39:29", "remaining_time": "1:27:11", "throughput": 3349.15, "total_tokens": 200846032} +{"current_steps": 165175, "total_steps": 179580, "loss": 0.799, "lr": 9.737689542618667e-07, "epoch": 18.395701080298473, "percentage": 91.98, "elapsed_time": "16:39:30", "remaining_time": "1:27:10", "throughput": 3349.16, "total_tokens": 200852016} +{"current_steps": 165180, "total_steps": 179580, "loss": 0.4997, "lr": 9.730975436166134e-07, "epoch": 18.396257935182092, "percentage": 91.98, "elapsed_time": "16:39:32", "remaining_time": "1:27:08", "throughput": 3349.16, "total_tokens": 200858064} +{"current_steps": 165185, "total_steps": 179580, "loss": 0.5944, "lr": 9.72426359924708e-07, "epoch": 18.396814790065708, "percentage": 91.98, "elapsed_time": "16:39:34", "remaining_time": "1:27:06", "throughput": 3349.16, "total_tokens": 200864016} +{"current_steps": 165190, "total_steps": 179580, "loss": 0.7159, "lr": 9.71755403192484e-07, "epoch": 18.397371644949327, "percentage": 91.99, "elapsed_time": "16:39:36", "remaining_time": "1:27:04", "throughput": 3349.17, "total_tokens": 200870192} +{"current_steps": 165195, "total_steps": 179580, "loss": 0.7165, "lr": 9.710846734262785e-07, "epoch": 18.397928499832943, "percentage": 91.99, "elapsed_time": "16:39:37", "remaining_time": "1:27:02", "throughput": 3349.17, "total_tokens": 200876144} +{"current_steps": 165200, "total_steps": 179580, "loss": 0.5185, "lr": 9.704141706324304e-07, "epoch": 18.39848535471656, "percentage": 91.99, "elapsed_time": "16:39:39", "remaining_time": "1:27:00", "throughput": 3349.17, "total_tokens": 200881872} +{"current_steps": 165205, "total_steps": 179580, "loss": 0.614, "lr": 9.697438948172737e-07, "epoch": 18.39904220960018, "percentage": 92.0, "elapsed_time": "16:39:41", "remaining_time": "1:26:59", "throughput": 3349.18, "total_tokens": 200888240} +{"current_steps": 165210, "total_steps": 179580, "loss": 0.6951, "lr": 9.690738459871424e-07, "epoch": 18.399599064483795, "percentage": 92.0, "elapsed_time": "16:39:43", "remaining_time": "1:26:57", "throughput": 3349.18, "total_tokens": 200894224} +{"current_steps": 165215, "total_steps": 179580, "loss": 1.0271, "lr": 9.68404024148356e-07, "epoch": 18.400155919367414, "percentage": 92.0, "elapsed_time": "16:39:44", "remaining_time": "1:26:55", "throughput": 3349.19, "total_tokens": 200900240} +{"current_steps": 165220, "total_steps": 179580, "loss": 0.6949, "lr": 9.677344293072516e-07, "epoch": 18.40071277425103, "percentage": 92.0, "elapsed_time": "16:39:46", "remaining_time": "1:26:53", "throughput": 3349.19, "total_tokens": 200906160} +{"current_steps": 165225, "total_steps": 179580, "loss": 0.5997, "lr": 9.670650614701459e-07, "epoch": 18.401269629134646, "percentage": 92.01, "elapsed_time": "16:39:48", "remaining_time": "1:26:51", "throughput": 3349.19, "total_tokens": 200912592} +{"current_steps": 165230, "total_steps": 179580, "loss": 0.8195, "lr": 9.663959206433704e-07, "epoch": 18.401826484018265, "percentage": 92.01, "elapsed_time": "16:39:50", "remaining_time": "1:26:50", "throughput": 3349.2, "total_tokens": 200918832} +{"current_steps": 165235, "total_steps": 179580, "loss": 0.682, "lr": 9.65727006833239e-07, "epoch": 18.40238333890188, "percentage": 92.01, "elapsed_time": "16:39:51", "remaining_time": "1:26:48", "throughput": 3349.2, "total_tokens": 200925136} +{"current_steps": 165240, "total_steps": 179580, "loss": 0.7337, "lr": 9.650583200460721e-07, "epoch": 18.4029401937855, "percentage": 92.01, "elapsed_time": "16:39:53", "remaining_time": "1:26:46", "throughput": 3349.21, "total_tokens": 200931504} +{"current_steps": 165245, "total_steps": 179580, "loss": 0.6464, "lr": 9.643898602881812e-07, "epoch": 18.403497048669117, "percentage": 92.02, "elapsed_time": "16:39:55", "remaining_time": "1:26:44", "throughput": 3349.21, "total_tokens": 200937520} +{"current_steps": 165250, "total_steps": 179580, "loss": 0.6562, "lr": 9.63721627565889e-07, "epoch": 18.404053903552736, "percentage": 92.02, "elapsed_time": "16:39:57", "remaining_time": "1:26:42", "throughput": 3349.21, "total_tokens": 200943440} +{"current_steps": 165255, "total_steps": 179580, "loss": 0.7457, "lr": 9.630536218855068e-07, "epoch": 18.404610758436352, "percentage": 92.02, "elapsed_time": "16:39:58", "remaining_time": "1:26:40", "throughput": 3349.21, "total_tokens": 200949424} +{"current_steps": 165260, "total_steps": 179580, "loss": 0.8354, "lr": 9.623858432533383e-07, "epoch": 18.405167613319968, "percentage": 92.03, "elapsed_time": "16:40:00", "remaining_time": "1:26:39", "throughput": 3349.22, "total_tokens": 200955696} +{"current_steps": 165265, "total_steps": 179580, "loss": 0.6331, "lr": 9.617182916756894e-07, "epoch": 18.405724468203587, "percentage": 92.03, "elapsed_time": "16:40:02", "remaining_time": "1:26:37", "throughput": 3349.22, "total_tokens": 200961904} +{"current_steps": 165270, "total_steps": 179580, "loss": 0.6847, "lr": 9.610509671588774e-07, "epoch": 18.406281323087203, "percentage": 92.03, "elapsed_time": "16:40:04", "remaining_time": "1:26:35", "throughput": 3349.22, "total_tokens": 200967888} +{"current_steps": 165275, "total_steps": 179580, "loss": 0.6135, "lr": 9.603838697091944e-07, "epoch": 18.40683817797082, "percentage": 92.03, "elapsed_time": "16:40:06", "remaining_time": "1:26:33", "throughput": 3349.23, "total_tokens": 200973968} +{"current_steps": 165280, "total_steps": 179580, "loss": 0.6673, "lr": 9.59716999332952e-07, "epoch": 18.40739503285444, "percentage": 92.04, "elapsed_time": "16:40:07", "remaining_time": "1:26:31", "throughput": 3349.23, "total_tokens": 200980112} +{"current_steps": 165285, "total_steps": 179580, "loss": 0.7195, "lr": 9.590503560364366e-07, "epoch": 18.407951887738054, "percentage": 92.04, "elapsed_time": "16:40:09", "remaining_time": "1:26:30", "throughput": 3349.23, "total_tokens": 200986288} +{"current_steps": 165290, "total_steps": 179580, "loss": 0.8454, "lr": 9.583839398259548e-07, "epoch": 18.408508742621674, "percentage": 92.04, "elapsed_time": "16:40:11", "remaining_time": "1:26:28", "throughput": 3349.24, "total_tokens": 200992528} +{"current_steps": 165295, "total_steps": 179580, "loss": 0.7946, "lr": 9.577177507077955e-07, "epoch": 18.40906559750529, "percentage": 92.05, "elapsed_time": "16:40:13", "remaining_time": "1:26:26", "throughput": 3349.24, "total_tokens": 200998704} +{"current_steps": 165300, "total_steps": 179580, "loss": 0.6225, "lr": 9.570517886882568e-07, "epoch": 18.40962245238891, "percentage": 92.05, "elapsed_time": "16:40:14", "remaining_time": "1:26:24", "throughput": 3349.24, "total_tokens": 201004656} +{"current_steps": 165305, "total_steps": 179580, "loss": 0.6466, "lr": 9.56386053773628e-07, "epoch": 18.410179307272525, "percentage": 92.05, "elapsed_time": "16:40:16", "remaining_time": "1:26:22", "throughput": 3349.25, "total_tokens": 201010736} +{"current_steps": 165310, "total_steps": 179580, "loss": 0.6255, "lr": 9.557205459701957e-07, "epoch": 18.41073616215614, "percentage": 92.05, "elapsed_time": "16:40:18", "remaining_time": "1:26:20", "throughput": 3349.25, "total_tokens": 201016784} +{"current_steps": 165315, "total_steps": 179580, "loss": 0.7135, "lr": 9.550552652842437e-07, "epoch": 18.41129301703976, "percentage": 92.06, "elapsed_time": "16:40:20", "remaining_time": "1:26:19", "throughput": 3349.26, "total_tokens": 201023088} +{"current_steps": 165320, "total_steps": 179580, "loss": 0.54, "lr": 9.543902117220643e-07, "epoch": 18.411849871923376, "percentage": 92.06, "elapsed_time": "16:40:22", "remaining_time": "1:26:17", "throughput": 3349.26, "total_tokens": 201029200} +{"current_steps": 165325, "total_steps": 179580, "loss": 0.64, "lr": 9.537253852899302e-07, "epoch": 18.412406726806996, "percentage": 92.06, "elapsed_time": "16:40:23", "remaining_time": "1:26:15", "throughput": 3349.26, "total_tokens": 201035120} +{"current_steps": 165330, "total_steps": 179580, "loss": 0.7085, "lr": 9.530607859941281e-07, "epoch": 18.41296358169061, "percentage": 92.06, "elapsed_time": "16:40:25", "remaining_time": "1:26:13", "throughput": 3349.27, "total_tokens": 201041168} +{"current_steps": 165335, "total_steps": 179580, "loss": 0.7111, "lr": 9.523964138409308e-07, "epoch": 18.413520436574228, "percentage": 92.07, "elapsed_time": "16:40:27", "remaining_time": "1:26:11", "throughput": 3349.27, "total_tokens": 201047280} +{"current_steps": 165340, "total_steps": 179580, "loss": 0.8072, "lr": 9.517322688366164e-07, "epoch": 18.414077291457847, "percentage": 92.07, "elapsed_time": "16:40:28", "remaining_time": "1:26:10", "throughput": 3349.27, "total_tokens": 201053520} +{"current_steps": 165345, "total_steps": 179580, "loss": 0.5556, "lr": 9.510683509874579e-07, "epoch": 18.414634146341463, "percentage": 92.07, "elapsed_time": "16:40:30", "remaining_time": "1:26:08", "throughput": 3349.28, "total_tokens": 201059696} +{"current_steps": 165350, "total_steps": 179580, "loss": 0.9372, "lr": 9.504046602997308e-07, "epoch": 18.415191001225082, "percentage": 92.08, "elapsed_time": "16:40:32", "remaining_time": "1:26:06", "throughput": 3349.28, "total_tokens": 201065872} +{"current_steps": 165355, "total_steps": 179580, "loss": 0.5645, "lr": 9.497411967796938e-07, "epoch": 18.4157478561087, "percentage": 92.08, "elapsed_time": "16:40:34", "remaining_time": "1:26:04", "throughput": 3349.28, "total_tokens": 201071664} +{"current_steps": 165360, "total_steps": 179580, "loss": 0.6856, "lr": 9.490779604336226e-07, "epoch": 18.416304710992314, "percentage": 92.08, "elapsed_time": "16:40:36", "remaining_time": "1:26:02", "throughput": 3349.28, "total_tokens": 201077776} +{"current_steps": 165365, "total_steps": 179580, "loss": 0.586, "lr": 9.484149512677814e-07, "epoch": 18.416861565875934, "percentage": 92.08, "elapsed_time": "16:40:37", "remaining_time": "1:26:00", "throughput": 3349.29, "total_tokens": 201083760} +{"current_steps": 165370, "total_steps": 179580, "loss": 0.8533, "lr": 9.477521692884267e-07, "epoch": 18.41741842075955, "percentage": 92.09, "elapsed_time": "16:40:39", "remaining_time": "1:25:59", "throughput": 3349.29, "total_tokens": 201089488} +{"current_steps": 165375, "total_steps": 179580, "loss": 0.7565, "lr": 9.470896145018254e-07, "epoch": 18.41797527564317, "percentage": 92.09, "elapsed_time": "16:40:41", "remaining_time": "1:25:57", "throughput": 3349.3, "total_tokens": 201095536} +{"current_steps": 165380, "total_steps": 179580, "loss": 0.8587, "lr": 9.464272869142337e-07, "epoch": 18.418532130526785, "percentage": 92.09, "elapsed_time": "16:40:42", "remaining_time": "1:25:55", "throughput": 3349.3, "total_tokens": 201101296} +{"current_steps": 165385, "total_steps": 179580, "loss": 0.7858, "lr": 9.457651865319078e-07, "epoch": 18.4190889854104, "percentage": 92.1, "elapsed_time": "16:40:44", "remaining_time": "1:25:53", "throughput": 3349.3, "total_tokens": 201107376} +{"current_steps": 165390, "total_steps": 179580, "loss": 0.5578, "lr": 9.451033133610981e-07, "epoch": 18.41964584029402, "percentage": 92.1, "elapsed_time": "16:40:46", "remaining_time": "1:25:51", "throughput": 3349.31, "total_tokens": 201113648} +{"current_steps": 165395, "total_steps": 179580, "loss": 0.6124, "lr": 9.444416674080636e-07, "epoch": 18.420202695177636, "percentage": 92.1, "elapsed_time": "16:40:48", "remaining_time": "1:25:49", "throughput": 3349.31, "total_tokens": 201119632} +{"current_steps": 165400, "total_steps": 179580, "loss": 0.6955, "lr": 9.43780248679052e-07, "epoch": 18.420759550061256, "percentage": 92.1, "elapsed_time": "16:40:49", "remaining_time": "1:25:48", "throughput": 3349.32, "total_tokens": 201126032} +{"current_steps": 165405, "total_steps": 179580, "loss": 0.7342, "lr": 9.431190571803083e-07, "epoch": 18.42131640494487, "percentage": 92.11, "elapsed_time": "16:40:51", "remaining_time": "1:25:46", "throughput": 3349.32, "total_tokens": 201132400} +{"current_steps": 165410, "total_steps": 179580, "loss": 0.6886, "lr": 9.424580929180749e-07, "epoch": 18.421873259828487, "percentage": 92.11, "elapsed_time": "16:40:53", "remaining_time": "1:25:44", "throughput": 3349.33, "total_tokens": 201138832} +{"current_steps": 165415, "total_steps": 179580, "loss": 0.9072, "lr": 9.417973558986048e-07, "epoch": 18.422430114712107, "percentage": 92.11, "elapsed_time": "16:40:55", "remaining_time": "1:25:42", "throughput": 3349.33, "total_tokens": 201145168} +{"current_steps": 165420, "total_steps": 179580, "loss": 0.9091, "lr": 9.411368461281294e-07, "epoch": 18.422986969595723, "percentage": 92.11, "elapsed_time": "16:40:57", "remaining_time": "1:25:40", "throughput": 3349.33, "total_tokens": 201151152} +{"current_steps": 165425, "total_steps": 179580, "loss": 0.5837, "lr": 9.404765636128965e-07, "epoch": 18.423543824479342, "percentage": 92.12, "elapsed_time": "16:40:58", "remaining_time": "1:25:39", "throughput": 3349.34, "total_tokens": 201157552} +{"current_steps": 165430, "total_steps": 179580, "loss": 0.6587, "lr": 9.398165083591343e-07, "epoch": 18.424100679362958, "percentage": 92.12, "elapsed_time": "16:41:00", "remaining_time": "1:25:37", "throughput": 3349.34, "total_tokens": 201163632} +{"current_steps": 165435, "total_steps": 179580, "loss": 0.5518, "lr": 9.39156680373085e-07, "epoch": 18.424657534246574, "percentage": 92.12, "elapsed_time": "16:41:02", "remaining_time": "1:25:35", "throughput": 3349.34, "total_tokens": 201169840} +{"current_steps": 165440, "total_steps": 179580, "loss": 0.8436, "lr": 9.384970796609771e-07, "epoch": 18.425214389130193, "percentage": 92.13, "elapsed_time": "16:41:04", "remaining_time": "1:25:33", "throughput": 3349.35, "total_tokens": 201176112} +{"current_steps": 165445, "total_steps": 179580, "loss": 0.6437, "lr": 9.378377062290417e-07, "epoch": 18.42577124401381, "percentage": 92.13, "elapsed_time": "16:41:06", "remaining_time": "1:25:31", "throughput": 3349.35, "total_tokens": 201182544} +{"current_steps": 165450, "total_steps": 179580, "loss": 0.8589, "lr": 9.371785600835098e-07, "epoch": 18.42632809889743, "percentage": 92.13, "elapsed_time": "16:41:07", "remaining_time": "1:25:30", "throughput": 3349.35, "total_tokens": 201188560} +{"current_steps": 165455, "total_steps": 179580, "loss": 0.7507, "lr": 9.365196412306043e-07, "epoch": 18.426884953781045, "percentage": 92.13, "elapsed_time": "16:41:09", "remaining_time": "1:25:28", "throughput": 3349.36, "total_tokens": 201194416} +{"current_steps": 165460, "total_steps": 179580, "loss": 0.5986, "lr": 9.358609496765452e-07, "epoch": 18.42744180866466, "percentage": 92.14, "elapsed_time": "16:41:11", "remaining_time": "1:25:26", "throughput": 3349.36, "total_tokens": 201200592} +{"current_steps": 165465, "total_steps": 179580, "loss": 0.8985, "lr": 9.352024854275637e-07, "epoch": 18.42799866354828, "percentage": 92.14, "elapsed_time": "16:41:13", "remaining_time": "1:25:24", "throughput": 3349.36, "total_tokens": 201206704} +{"current_steps": 165470, "total_steps": 179580, "loss": 0.8029, "lr": 9.34544248489877e-07, "epoch": 18.428555518431896, "percentage": 92.14, "elapsed_time": "16:41:14", "remaining_time": "1:25:22", "throughput": 3349.37, "total_tokens": 201211856} +{"current_steps": 165475, "total_steps": 179580, "loss": 0.7338, "lr": 9.338862388696995e-07, "epoch": 18.429112373315515, "percentage": 92.15, "elapsed_time": "16:41:16", "remaining_time": "1:25:20", "throughput": 3349.37, "total_tokens": 201218128} +{"current_steps": 165480, "total_steps": 179580, "loss": 0.6727, "lr": 9.33228456573243e-07, "epoch": 18.42966922819913, "percentage": 92.15, "elapsed_time": "16:41:18", "remaining_time": "1:25:19", "throughput": 3349.37, "total_tokens": 201223952} +{"current_steps": 165485, "total_steps": 179580, "loss": 0.6863, "lr": 9.325709016067302e-07, "epoch": 18.430226083082747, "percentage": 92.15, "elapsed_time": "16:41:19", "remaining_time": "1:25:17", "throughput": 3349.38, "total_tokens": 201230160} +{"current_steps": 165490, "total_steps": 179580, "loss": 0.6886, "lr": 9.319135739763646e-07, "epoch": 18.430782937966367, "percentage": 92.15, "elapsed_time": "16:41:21", "remaining_time": "1:25:15", "throughput": 3349.38, "total_tokens": 201236592} +{"current_steps": 165495, "total_steps": 179580, "loss": 0.6536, "lr": 9.312564736883661e-07, "epoch": 18.431339792849982, "percentage": 92.16, "elapsed_time": "16:41:23", "remaining_time": "1:25:13", "throughput": 3349.39, "total_tokens": 201242768} +{"current_steps": 165500, "total_steps": 179580, "loss": 0.597, "lr": 9.30599600748927e-07, "epoch": 18.431896647733602, "percentage": 92.16, "elapsed_time": "16:41:25", "remaining_time": "1:25:11", "throughput": 3349.39, "total_tokens": 201249008} +{"current_steps": 165505, "total_steps": 179580, "loss": 0.7009, "lr": 9.299429551642591e-07, "epoch": 18.432453502617218, "percentage": 92.16, "elapsed_time": "16:41:27", "remaining_time": "1:25:09", "throughput": 3349.4, "total_tokens": 201255408} +{"current_steps": 165510, "total_steps": 179580, "loss": 0.5845, "lr": 9.292865369405656e-07, "epoch": 18.433010357500834, "percentage": 92.17, "elapsed_time": "16:41:28", "remaining_time": "1:25:08", "throughput": 3349.4, "total_tokens": 201261328} +{"current_steps": 165515, "total_steps": 179580, "loss": 0.7443, "lr": 9.286303460840446e-07, "epoch": 18.433567212384453, "percentage": 92.17, "elapsed_time": "16:41:30", "remaining_time": "1:25:06", "throughput": 3349.4, "total_tokens": 201267632} +{"current_steps": 165520, "total_steps": 179580, "loss": 0.7301, "lr": 9.279743826008991e-07, "epoch": 18.43412406726807, "percentage": 92.17, "elapsed_time": "16:41:32", "remaining_time": "1:25:04", "throughput": 3349.4, "total_tokens": 201273904} +{"current_steps": 165525, "total_steps": 179580, "loss": 0.8178, "lr": 9.273186464973216e-07, "epoch": 18.43468092215169, "percentage": 92.17, "elapsed_time": "16:41:34", "remaining_time": "1:25:02", "throughput": 3349.41, "total_tokens": 201280176} +{"current_steps": 165530, "total_steps": 179580, "loss": 1.0046, "lr": 9.266631377795015e-07, "epoch": 18.435237777035304, "percentage": 92.18, "elapsed_time": "16:41:35", "remaining_time": "1:25:00", "throughput": 3349.41, "total_tokens": 201285744} +{"current_steps": 165535, "total_steps": 179580, "loss": 0.6026, "lr": 9.260078564536395e-07, "epoch": 18.43579463191892, "percentage": 92.18, "elapsed_time": "16:41:37", "remaining_time": "1:24:59", "throughput": 3349.41, "total_tokens": 201291440} +{"current_steps": 165540, "total_steps": 179580, "loss": 0.9536, "lr": 9.253528025259195e-07, "epoch": 18.43635148680254, "percentage": 92.18, "elapsed_time": "16:41:39", "remaining_time": "1:24:57", "throughput": 3349.41, "total_tokens": 201297200} +{"current_steps": 165545, "total_steps": 179580, "loss": 0.7115, "lr": 9.246979760025309e-07, "epoch": 18.436908341686156, "percentage": 92.18, "elapsed_time": "16:41:41", "remaining_time": "1:24:55", "throughput": 3349.42, "total_tokens": 201303472} +{"current_steps": 165550, "total_steps": 179580, "loss": 0.869, "lr": 9.240433768896578e-07, "epoch": 18.437465196569775, "percentage": 92.19, "elapsed_time": "16:41:42", "remaining_time": "1:24:53", "throughput": 3349.42, "total_tokens": 201309840} +{"current_steps": 165555, "total_steps": 179580, "loss": 0.767, "lr": 9.233890051934841e-07, "epoch": 18.43802205145339, "percentage": 92.19, "elapsed_time": "16:41:44", "remaining_time": "1:24:51", "throughput": 3349.42, "total_tokens": 201315952} +{"current_steps": 165560, "total_steps": 179580, "loss": 0.8951, "lr": 9.227348609201908e-07, "epoch": 18.438578906337007, "percentage": 92.19, "elapsed_time": "16:41:46", "remaining_time": "1:24:49", "throughput": 3349.43, "total_tokens": 201322224} +{"current_steps": 165565, "total_steps": 179580, "loss": 0.7584, "lr": 9.220809440759592e-07, "epoch": 18.439135761220626, "percentage": 92.2, "elapsed_time": "16:41:48", "remaining_time": "1:24:48", "throughput": 3349.43, "total_tokens": 201328464} +{"current_steps": 165570, "total_steps": 179580, "loss": 0.8102, "lr": 9.21427254666965e-07, "epoch": 18.439692616104242, "percentage": 92.2, "elapsed_time": "16:41:49", "remaining_time": "1:24:46", "throughput": 3349.44, "total_tokens": 201334352} +{"current_steps": 165575, "total_steps": 179580, "loss": 0.6661, "lr": 9.207737926993781e-07, "epoch": 18.44024947098786, "percentage": 92.2, "elapsed_time": "16:41:51", "remaining_time": "1:24:44", "throughput": 3349.44, "total_tokens": 201340560} +{"current_steps": 165580, "total_steps": 179580, "loss": 0.6415, "lr": 9.20120558179377e-07, "epoch": 18.440806325871478, "percentage": 92.2, "elapsed_time": "16:41:53", "remaining_time": "1:24:42", "throughput": 3349.44, "total_tokens": 201346096} +{"current_steps": 165585, "total_steps": 179580, "loss": 0.6254, "lr": 9.19467551113129e-07, "epoch": 18.441363180755094, "percentage": 92.21, "elapsed_time": "16:41:55", "remaining_time": "1:24:40", "throughput": 3349.45, "total_tokens": 201352208} +{"current_steps": 165590, "total_steps": 179580, "loss": 0.6244, "lr": 9.188147715068041e-07, "epoch": 18.441920035638713, "percentage": 92.21, "elapsed_time": "16:41:56", "remaining_time": "1:24:39", "throughput": 3349.45, "total_tokens": 201357872} +{"current_steps": 165595, "total_steps": 179580, "loss": 0.7871, "lr": 9.181622193665668e-07, "epoch": 18.44247689052233, "percentage": 92.21, "elapsed_time": "16:41:58", "remaining_time": "1:24:37", "throughput": 3349.45, "total_tokens": 201363824} +{"current_steps": 165600, "total_steps": 179580, "loss": 1.0227, "lr": 9.175098946985789e-07, "epoch": 18.44303374540595, "percentage": 92.22, "elapsed_time": "16:42:00", "remaining_time": "1:24:35", "throughput": 3349.45, "total_tokens": 201369296} +{"current_steps": 165605, "total_steps": 179580, "loss": 0.8538, "lr": 9.168577975090076e-07, "epoch": 18.443590600289564, "percentage": 92.22, "elapsed_time": "16:42:01", "remaining_time": "1:24:33", "throughput": 3349.46, "total_tokens": 201375536} +{"current_steps": 165610, "total_steps": 179580, "loss": 0.6041, "lr": 9.162059278040063e-07, "epoch": 18.44414745517318, "percentage": 92.22, "elapsed_time": "16:42:03", "remaining_time": "1:24:31", "throughput": 3349.46, "total_tokens": 201382032} +{"current_steps": 165615, "total_steps": 179580, "loss": 0.8351, "lr": 9.155542855897425e-07, "epoch": 18.4447043100568, "percentage": 92.22, "elapsed_time": "16:42:05", "remaining_time": "1:24:29", "throughput": 3349.46, "total_tokens": 201388336} +{"current_steps": 165620, "total_steps": 179580, "loss": 0.7142, "lr": 9.149028708723583e-07, "epoch": 18.445261164940415, "percentage": 92.23, "elapsed_time": "16:42:07", "remaining_time": "1:24:28", "throughput": 3349.47, "total_tokens": 201394192} +{"current_steps": 165625, "total_steps": 179580, "loss": 0.5781, "lr": 9.142516836580156e-07, "epoch": 18.445818019824035, "percentage": 92.23, "elapsed_time": "16:42:09", "remaining_time": "1:24:26", "throughput": 3349.47, "total_tokens": 201400400} +{"current_steps": 165630, "total_steps": 179580, "loss": 1.0014, "lr": 9.136007239528593e-07, "epoch": 18.44637487470765, "percentage": 92.23, "elapsed_time": "16:42:10", "remaining_time": "1:24:24", "throughput": 3349.47, "total_tokens": 201406416} +{"current_steps": 165635, "total_steps": 179580, "loss": 0.4915, "lr": 9.129499917630458e-07, "epoch": 18.44693172959127, "percentage": 92.23, "elapsed_time": "16:42:12", "remaining_time": "1:24:22", "throughput": 3349.48, "total_tokens": 201412784} +{"current_steps": 165640, "total_steps": 179580, "loss": 0.7118, "lr": 9.122994870947171e-07, "epoch": 18.447488584474886, "percentage": 92.24, "elapsed_time": "16:42:14", "remaining_time": "1:24:20", "throughput": 3349.48, "total_tokens": 201418960} +{"current_steps": 165645, "total_steps": 179580, "loss": 0.7406, "lr": 9.116492099540186e-07, "epoch": 18.448045439358502, "percentage": 92.24, "elapsed_time": "16:42:16", "remaining_time": "1:24:18", "throughput": 3349.48, "total_tokens": 201425040} +{"current_steps": 165650, "total_steps": 179580, "loss": 0.923, "lr": 9.109991603470896e-07, "epoch": 18.44860229424212, "percentage": 92.24, "elapsed_time": "16:42:17", "remaining_time": "1:24:17", "throughput": 3349.49, "total_tokens": 201431024} +{"current_steps": 165655, "total_steps": 179580, "loss": 0.4217, "lr": 9.103493382800781e-07, "epoch": 18.449159149125737, "percentage": 92.25, "elapsed_time": "16:42:19", "remaining_time": "1:24:15", "throughput": 3349.49, "total_tokens": 201437168} +{"current_steps": 165660, "total_steps": 179580, "loss": 0.6996, "lr": 9.096997437591153e-07, "epoch": 18.449716004009357, "percentage": 92.25, "elapsed_time": "16:42:21", "remaining_time": "1:24:13", "throughput": 3349.49, "total_tokens": 201443568} +{"current_steps": 165665, "total_steps": 179580, "loss": 0.9125, "lr": 9.090503767903408e-07, "epoch": 18.450272858892973, "percentage": 92.25, "elapsed_time": "16:42:23", "remaining_time": "1:24:11", "throughput": 3349.5, "total_tokens": 201449968} +{"current_steps": 165670, "total_steps": 179580, "loss": 0.6973, "lr": 9.084012373798828e-07, "epoch": 18.45082971377659, "percentage": 92.25, "elapsed_time": "16:42:25", "remaining_time": "1:24:09", "throughput": 3349.5, "total_tokens": 201455856} +{"current_steps": 165675, "total_steps": 179580, "loss": 0.6083, "lr": 9.077523255338783e-07, "epoch": 18.451386568660208, "percentage": 92.26, "elapsed_time": "16:42:26", "remaining_time": "1:24:08", "throughput": 3349.5, "total_tokens": 201461744} +{"current_steps": 165680, "total_steps": 179580, "loss": 0.6654, "lr": 9.071036412584555e-07, "epoch": 18.451943423543824, "percentage": 92.26, "elapsed_time": "16:42:28", "remaining_time": "1:24:06", "throughput": 3349.51, "total_tokens": 201467888} +{"current_steps": 165685, "total_steps": 179580, "loss": 0.5592, "lr": 9.064551845597457e-07, "epoch": 18.452500278427443, "percentage": 92.26, "elapsed_time": "16:42:30", "remaining_time": "1:24:04", "throughput": 3349.51, "total_tokens": 201474160} +{"current_steps": 165690, "total_steps": 179580, "loss": 0.7249, "lr": 9.058069554438664e-07, "epoch": 18.45305713331106, "percentage": 92.27, "elapsed_time": "16:42:32", "remaining_time": "1:24:02", "throughput": 3349.51, "total_tokens": 201480368} +{"current_steps": 165695, "total_steps": 179580, "loss": 0.6396, "lr": 9.051589539169458e-07, "epoch": 18.453613988194675, "percentage": 92.27, "elapsed_time": "16:42:33", "remaining_time": "1:24:00", "throughput": 3349.52, "total_tokens": 201486576} +{"current_steps": 165700, "total_steps": 179580, "loss": 0.5198, "lr": 9.045111799850986e-07, "epoch": 18.454170843078295, "percentage": 92.27, "elapsed_time": "16:42:35", "remaining_time": "1:23:58", "throughput": 3349.52, "total_tokens": 201492880} +{"current_steps": 165705, "total_steps": 179580, "loss": 0.7905, "lr": 9.038636336544532e-07, "epoch": 18.45472769796191, "percentage": 92.27, "elapsed_time": "16:42:37", "remaining_time": "1:23:57", "throughput": 3349.53, "total_tokens": 201498672} +{"current_steps": 165710, "total_steps": 179580, "loss": 0.8523, "lr": 9.032163149311213e-07, "epoch": 18.45528455284553, "percentage": 92.28, "elapsed_time": "16:42:39", "remaining_time": "1:23:55", "throughput": 3349.53, "total_tokens": 201504720} +{"current_steps": 165715, "total_steps": 179580, "loss": 0.7761, "lr": 9.025692238212174e-07, "epoch": 18.455841407729146, "percentage": 92.28, "elapsed_time": "16:42:40", "remaining_time": "1:23:53", "throughput": 3349.53, "total_tokens": 201511024} +{"current_steps": 165720, "total_steps": 179580, "loss": 0.7717, "lr": 9.019223603308508e-07, "epoch": 18.456398262612762, "percentage": 92.28, "elapsed_time": "16:42:42", "remaining_time": "1:23:51", "throughput": 3349.53, "total_tokens": 201517072} +{"current_steps": 165725, "total_steps": 179580, "loss": 0.7581, "lr": 9.012757244661385e-07, "epoch": 18.45695511749638, "percentage": 92.28, "elapsed_time": "16:42:44", "remaining_time": "1:23:49", "throughput": 3349.54, "total_tokens": 201523344} +{"current_steps": 165730, "total_steps": 179580, "loss": 0.6724, "lr": 9.006293162331813e-07, "epoch": 18.457511972379997, "percentage": 92.29, "elapsed_time": "16:42:46", "remaining_time": "1:23:48", "throughput": 3349.54, "total_tokens": 201529264} +{"current_steps": 165735, "total_steps": 179580, "loss": 0.5789, "lr": 8.999831356380911e-07, "epoch": 18.458068827263617, "percentage": 92.29, "elapsed_time": "16:42:47", "remaining_time": "1:23:46", "throughput": 3349.54, "total_tokens": 201535280} +{"current_steps": 165740, "total_steps": 179580, "loss": 0.7848, "lr": 8.993371826869656e-07, "epoch": 18.458625682147233, "percentage": 92.29, "elapsed_time": "16:42:49", "remaining_time": "1:23:44", "throughput": 3349.55, "total_tokens": 201541712} +{"current_steps": 165745, "total_steps": 179580, "loss": 0.824, "lr": 8.986914573859112e-07, "epoch": 18.45918253703085, "percentage": 92.3, "elapsed_time": "16:42:51", "remaining_time": "1:23:42", "throughput": 3349.55, "total_tokens": 201548048} +{"current_steps": 165750, "total_steps": 179580, "loss": 0.6373, "lr": 8.980459597410257e-07, "epoch": 18.459739391914468, "percentage": 92.3, "elapsed_time": "16:42:53", "remaining_time": "1:23:40", "throughput": 3349.56, "total_tokens": 201554000} +{"current_steps": 165755, "total_steps": 179580, "loss": 0.811, "lr": 8.97400689758407e-07, "epoch": 18.460296246798084, "percentage": 92.3, "elapsed_time": "16:42:55", "remaining_time": "1:23:38", "throughput": 3349.56, "total_tokens": 201560144} +{"current_steps": 165760, "total_steps": 179580, "loss": 0.5964, "lr": 8.967556474441474e-07, "epoch": 18.460853101681703, "percentage": 92.3, "elapsed_time": "16:42:56", "remaining_time": "1:23:37", "throughput": 3349.56, "total_tokens": 201566192} +{"current_steps": 165765, "total_steps": 179580, "loss": 0.7043, "lr": 8.961108328043449e-07, "epoch": 18.46140995656532, "percentage": 92.31, "elapsed_time": "16:42:58", "remaining_time": "1:23:35", "throughput": 3349.56, "total_tokens": 201572016} +{"current_steps": 165770, "total_steps": 179580, "loss": 0.7906, "lr": 8.954662458450864e-07, "epoch": 18.461966811448935, "percentage": 92.31, "elapsed_time": "16:43:00", "remaining_time": "1:23:33", "throughput": 3349.57, "total_tokens": 201578256} +{"current_steps": 165775, "total_steps": 179580, "loss": 0.6454, "lr": 8.948218865724584e-07, "epoch": 18.462523666332554, "percentage": 92.31, "elapsed_time": "16:43:02", "remaining_time": "1:23:31", "throughput": 3349.57, "total_tokens": 201584432} +{"current_steps": 165780, "total_steps": 179580, "loss": 0.6179, "lr": 8.941777549925535e-07, "epoch": 18.46308052121617, "percentage": 92.32, "elapsed_time": "16:43:04", "remaining_time": "1:23:29", "throughput": 3349.57, "total_tokens": 201590800} +{"current_steps": 165785, "total_steps": 179580, "loss": 0.7312, "lr": 8.935338511114527e-07, "epoch": 18.46363737609979, "percentage": 92.32, "elapsed_time": "16:43:05", "remaining_time": "1:23:28", "throughput": 3349.58, "total_tokens": 201597072} +{"current_steps": 165790, "total_steps": 179580, "loss": 0.6522, "lr": 8.928901749352376e-07, "epoch": 18.464194230983406, "percentage": 92.32, "elapsed_time": "16:43:07", "remaining_time": "1:23:26", "throughput": 3349.58, "total_tokens": 201603056} +{"current_steps": 165795, "total_steps": 179580, "loss": 0.5798, "lr": 8.92246726469989e-07, "epoch": 18.46475108586702, "percentage": 92.32, "elapsed_time": "16:43:09", "remaining_time": "1:23:24", "throughput": 3349.58, "total_tokens": 201609136} +{"current_steps": 165800, "total_steps": 179580, "loss": 0.8652, "lr": 8.916035057217859e-07, "epoch": 18.46530794075064, "percentage": 92.33, "elapsed_time": "16:43:11", "remaining_time": "1:23:22", "throughput": 3349.59, "total_tokens": 201615696} +{"current_steps": 165805, "total_steps": 179580, "loss": 0.7022, "lr": 8.909605126967036e-07, "epoch": 18.465864795634257, "percentage": 92.33, "elapsed_time": "16:43:12", "remaining_time": "1:23:20", "throughput": 3349.59, "total_tokens": 201621552} +{"current_steps": 165810, "total_steps": 179580, "loss": 0.521, "lr": 8.903177474008151e-07, "epoch": 18.466421650517876, "percentage": 92.33, "elapsed_time": "16:43:14", "remaining_time": "1:23:18", "throughput": 3349.59, "total_tokens": 201627440} +{"current_steps": 165815, "total_steps": 179580, "loss": 0.6626, "lr": 8.896752098401879e-07, "epoch": 18.466978505401492, "percentage": 92.33, "elapsed_time": "16:43:16", "remaining_time": "1:23:17", "throughput": 3349.59, "total_tokens": 201633488} +{"current_steps": 165820, "total_steps": 179580, "loss": 0.6349, "lr": 8.890329000208975e-07, "epoch": 18.46753536028511, "percentage": 92.34, "elapsed_time": "16:43:18", "remaining_time": "1:23:15", "throughput": 3349.6, "total_tokens": 201639184} +{"current_steps": 165825, "total_steps": 179580, "loss": 0.9211, "lr": 8.883908179490086e-07, "epoch": 18.468092215168728, "percentage": 92.34, "elapsed_time": "16:43:19", "remaining_time": "1:23:13", "throughput": 3349.6, "total_tokens": 201645264} +{"current_steps": 165830, "total_steps": 179580, "loss": 0.8108, "lr": 8.877489636305885e-07, "epoch": 18.468649070052344, "percentage": 92.34, "elapsed_time": "16:43:21", "remaining_time": "1:23:11", "throughput": 3349.6, "total_tokens": 201651568} +{"current_steps": 165835, "total_steps": 179580, "loss": 0.5966, "lr": 8.871073370716937e-07, "epoch": 18.469205924935963, "percentage": 92.35, "elapsed_time": "16:43:23", "remaining_time": "1:23:09", "throughput": 3349.61, "total_tokens": 201657712} +{"current_steps": 165840, "total_steps": 179580, "loss": 0.4765, "lr": 8.864659382783941e-07, "epoch": 18.46976277981958, "percentage": 92.35, "elapsed_time": "16:43:25", "remaining_time": "1:23:08", "throughput": 3349.61, "total_tokens": 201663952} +{"current_steps": 165845, "total_steps": 179580, "loss": 0.6043, "lr": 8.858247672567377e-07, "epoch": 18.470319634703195, "percentage": 92.35, "elapsed_time": "16:43:27", "remaining_time": "1:23:06", "throughput": 3349.61, "total_tokens": 201670352} +{"current_steps": 165850, "total_steps": 179580, "loss": 0.746, "lr": 8.851838240127891e-07, "epoch": 18.470876489586814, "percentage": 92.35, "elapsed_time": "16:43:28", "remaining_time": "1:23:04", "throughput": 3349.62, "total_tokens": 201676304} +{"current_steps": 165855, "total_steps": 179580, "loss": 0.8116, "lr": 8.845431085526018e-07, "epoch": 18.47143334447043, "percentage": 92.36, "elapsed_time": "16:43:30", "remaining_time": "1:23:02", "throughput": 3349.62, "total_tokens": 201682384} +{"current_steps": 165860, "total_steps": 179580, "loss": 0.6195, "lr": 8.839026208822238e-07, "epoch": 18.47199019935405, "percentage": 92.36, "elapsed_time": "16:43:32", "remaining_time": "1:23:00", "throughput": 3349.62, "total_tokens": 201688400} +{"current_steps": 165865, "total_steps": 179580, "loss": 0.5842, "lr": 8.832623610077057e-07, "epoch": 18.472547054237666, "percentage": 92.36, "elapsed_time": "16:43:34", "remaining_time": "1:22:58", "throughput": 3349.63, "total_tokens": 201694448} +{"current_steps": 165870, "total_steps": 179580, "loss": 0.7599, "lr": 8.826223289350982e-07, "epoch": 18.47310390912128, "percentage": 92.37, "elapsed_time": "16:43:35", "remaining_time": "1:22:57", "throughput": 3349.63, "total_tokens": 201700176} +{"current_steps": 165875, "total_steps": 179580, "loss": 1.0142, "lr": 8.819825246704466e-07, "epoch": 18.4736607640049, "percentage": 92.37, "elapsed_time": "16:43:37", "remaining_time": "1:22:55", "throughput": 3349.63, "total_tokens": 201706032} +{"current_steps": 165880, "total_steps": 179580, "loss": 0.7609, "lr": 8.813429482197933e-07, "epoch": 18.474217618888517, "percentage": 92.37, "elapsed_time": "16:43:39", "remaining_time": "1:22:53", "throughput": 3349.63, "total_tokens": 201711856} +{"current_steps": 165885, "total_steps": 179580, "loss": 0.6603, "lr": 8.80703599589175e-07, "epoch": 18.474774473772136, "percentage": 92.37, "elapsed_time": "16:43:40", "remaining_time": "1:22:51", "throughput": 3349.64, "total_tokens": 201717808} +{"current_steps": 165890, "total_steps": 179580, "loss": 0.6841, "lr": 8.800644787846396e-07, "epoch": 18.475331328655752, "percentage": 92.38, "elapsed_time": "16:43:42", "remaining_time": "1:22:49", "throughput": 3349.64, "total_tokens": 201723888} +{"current_steps": 165895, "total_steps": 179580, "loss": 0.7384, "lr": 8.794255858122158e-07, "epoch": 18.475888183539368, "percentage": 92.38, "elapsed_time": "16:43:44", "remaining_time": "1:22:48", "throughput": 3349.64, "total_tokens": 201730128} +{"current_steps": 165900, "total_steps": 179580, "loss": 0.909, "lr": 8.787869206779487e-07, "epoch": 18.476445038422987, "percentage": 92.38, "elapsed_time": "16:43:46", "remaining_time": "1:22:46", "throughput": 3349.65, "total_tokens": 201736144} +{"current_steps": 165905, "total_steps": 179580, "loss": 0.5388, "lr": 8.781484833878584e-07, "epoch": 18.477001893306603, "percentage": 92.39, "elapsed_time": "16:43:47", "remaining_time": "1:22:44", "throughput": 3349.65, "total_tokens": 201742256} +{"current_steps": 165910, "total_steps": 179580, "loss": 0.8444, "lr": 8.775102739479846e-07, "epoch": 18.477558748190223, "percentage": 92.39, "elapsed_time": "16:43:49", "remaining_time": "1:22:42", "throughput": 3349.65, "total_tokens": 201748464} +{"current_steps": 165915, "total_steps": 179580, "loss": 0.9202, "lr": 8.768722923643502e-07, "epoch": 18.47811560307384, "percentage": 92.39, "elapsed_time": "16:43:51", "remaining_time": "1:22:40", "throughput": 3349.66, "total_tokens": 201754768} +{"current_steps": 165920, "total_steps": 179580, "loss": 0.862, "lr": 8.762345386429865e-07, "epoch": 18.478672457957455, "percentage": 92.39, "elapsed_time": "16:43:53", "remaining_time": "1:22:38", "throughput": 3349.66, "total_tokens": 201760688} +{"current_steps": 165925, "total_steps": 179580, "loss": 0.9444, "lr": 8.755970127899166e-07, "epoch": 18.479229312841074, "percentage": 92.4, "elapsed_time": "16:43:54", "remaining_time": "1:22:37", "throughput": 3349.66, "total_tokens": 201766608} +{"current_steps": 165930, "total_steps": 179580, "loss": 0.7059, "lr": 8.749597148111604e-07, "epoch": 18.47978616772469, "percentage": 92.4, "elapsed_time": "16:43:56", "remaining_time": "1:22:35", "throughput": 3349.67, "total_tokens": 201773136} +{"current_steps": 165935, "total_steps": 179580, "loss": 0.6481, "lr": 8.743226447127356e-07, "epoch": 18.48034302260831, "percentage": 92.4, "elapsed_time": "16:43:58", "remaining_time": "1:22:33", "throughput": 3349.67, "total_tokens": 201779696} +{"current_steps": 165940, "total_steps": 179580, "loss": 0.7952, "lr": 8.73685802500665e-07, "epoch": 18.480899877491925, "percentage": 92.4, "elapsed_time": "16:44:00", "remaining_time": "1:22:31", "throughput": 3349.68, "total_tokens": 201785744} +{"current_steps": 165945, "total_steps": 179580, "loss": 0.6882, "lr": 8.730491881809633e-07, "epoch": 18.48145673237554, "percentage": 92.41, "elapsed_time": "16:44:02", "remaining_time": "1:22:29", "throughput": 3349.68, "total_tokens": 201791920} +{"current_steps": 165950, "total_steps": 179580, "loss": 0.6737, "lr": 8.724128017596394e-07, "epoch": 18.48201358725916, "percentage": 92.41, "elapsed_time": "16:44:03", "remaining_time": "1:22:28", "throughput": 3349.68, "total_tokens": 201797744} +{"current_steps": 165955, "total_steps": 179580, "loss": 0.7825, "lr": 8.717766432427055e-07, "epoch": 18.482570442142777, "percentage": 92.41, "elapsed_time": "16:44:05", "remaining_time": "1:22:26", "throughput": 3349.69, "total_tokens": 201803728} +{"current_steps": 165960, "total_steps": 179580, "loss": 0.7898, "lr": 8.711407126361759e-07, "epoch": 18.483127297026396, "percentage": 92.42, "elapsed_time": "16:44:07", "remaining_time": "1:22:24", "throughput": 3349.69, "total_tokens": 201809552} +{"current_steps": 165965, "total_steps": 179580, "loss": 0.8185, "lr": 8.705050099460516e-07, "epoch": 18.483684151910012, "percentage": 92.42, "elapsed_time": "16:44:08", "remaining_time": "1:22:22", "throughput": 3349.69, "total_tokens": 201814896} +{"current_steps": 165970, "total_steps": 179580, "loss": 0.7498, "lr": 8.698695351783415e-07, "epoch": 18.48424100679363, "percentage": 92.42, "elapsed_time": "16:44:10", "remaining_time": "1:22:20", "throughput": 3349.69, "total_tokens": 201821040} +{"current_steps": 165975, "total_steps": 179580, "loss": 0.6575, "lr": 8.692342883390464e-07, "epoch": 18.484797861677247, "percentage": 92.42, "elapsed_time": "16:44:12", "remaining_time": "1:22:18", "throughput": 3349.69, "total_tokens": 201826992} +{"current_steps": 165980, "total_steps": 179580, "loss": 0.7058, "lr": 8.685992694341671e-07, "epoch": 18.485354716560863, "percentage": 92.43, "elapsed_time": "16:44:14", "remaining_time": "1:22:17", "throughput": 3349.7, "total_tokens": 201833104} +{"current_steps": 165985, "total_steps": 179580, "loss": 0.6375, "lr": 8.679644784696988e-07, "epoch": 18.485911571444483, "percentage": 92.43, "elapsed_time": "16:44:15", "remaining_time": "1:22:15", "throughput": 3349.7, "total_tokens": 201839088} +{"current_steps": 165990, "total_steps": 179580, "loss": 0.7494, "lr": 8.673299154516423e-07, "epoch": 18.4864684263281, "percentage": 92.43, "elapsed_time": "16:44:17", "remaining_time": "1:22:13", "throughput": 3349.7, "total_tokens": 201844784} +{"current_steps": 165995, "total_steps": 179580, "loss": 0.6697, "lr": 8.666955803859928e-07, "epoch": 18.487025281211718, "percentage": 92.44, "elapsed_time": "16:44:19", "remaining_time": "1:22:11", "throughput": 3349.71, "total_tokens": 201850928} +{"current_steps": 166000, "total_steps": 179580, "loss": 0.8535, "lr": 8.660614732787343e-07, "epoch": 18.487582136095334, "percentage": 92.44, "elapsed_time": "16:44:21", "remaining_time": "1:22:09", "throughput": 3349.71, "total_tokens": 201857136} +{"current_steps": 166005, "total_steps": 179580, "loss": 0.7788, "lr": 8.654275941358592e-07, "epoch": 18.48813899097895, "percentage": 92.44, "elapsed_time": "16:44:22", "remaining_time": "1:22:07", "throughput": 3349.71, "total_tokens": 201862768} +{"current_steps": 166010, "total_steps": 179580, "loss": 0.6329, "lr": 8.647939429633628e-07, "epoch": 18.48869584586257, "percentage": 92.44, "elapsed_time": "16:44:24", "remaining_time": "1:22:06", "throughput": 3349.72, "total_tokens": 201868944} +{"current_steps": 166015, "total_steps": 179580, "loss": 0.8103, "lr": 8.641605197672182e-07, "epoch": 18.489252700746185, "percentage": 92.45, "elapsed_time": "16:44:26", "remaining_time": "1:22:04", "throughput": 3349.72, "total_tokens": 201875248} +{"current_steps": 166020, "total_steps": 179580, "loss": 0.8894, "lr": 8.635273245534203e-07, "epoch": 18.489809555629805, "percentage": 92.45, "elapsed_time": "16:44:28", "remaining_time": "1:22:02", "throughput": 3349.72, "total_tokens": 201881520} +{"current_steps": 166025, "total_steps": 179580, "loss": 0.7363, "lr": 8.628943573279425e-07, "epoch": 18.49036641051342, "percentage": 92.45, "elapsed_time": "16:44:29", "remaining_time": "1:22:00", "throughput": 3349.73, "total_tokens": 201887568} +{"current_steps": 166030, "total_steps": 179580, "loss": 0.8024, "lr": 8.622616180967658e-07, "epoch": 18.490923265397036, "percentage": 92.45, "elapsed_time": "16:44:31", "remaining_time": "1:21:58", "throughput": 3349.73, "total_tokens": 201894000} +{"current_steps": 166035, "total_steps": 179580, "loss": 0.6818, "lr": 8.616291068658633e-07, "epoch": 18.491480120280656, "percentage": 92.46, "elapsed_time": "16:44:33", "remaining_time": "1:21:57", "throughput": 3349.74, "total_tokens": 201900272} +{"current_steps": 166040, "total_steps": 179580, "loss": 0.8191, "lr": 8.609968236412163e-07, "epoch": 18.49203697516427, "percentage": 92.46, "elapsed_time": "16:44:35", "remaining_time": "1:21:55", "throughput": 3349.74, "total_tokens": 201905872} +{"current_steps": 166045, "total_steps": 179580, "loss": 0.4604, "lr": 8.603647684287952e-07, "epoch": 18.49259383004789, "percentage": 92.46, "elapsed_time": "16:44:36", "remaining_time": "1:21:53", "throughput": 3349.74, "total_tokens": 201912336} +{"current_steps": 166050, "total_steps": 179580, "loss": 0.7698, "lr": 8.597329412345701e-07, "epoch": 18.493150684931507, "percentage": 92.47, "elapsed_time": "16:44:38", "remaining_time": "1:21:51", "throughput": 3349.75, "total_tokens": 201918160} +{"current_steps": 166055, "total_steps": 179580, "loss": 0.4754, "lr": 8.591013420645055e-07, "epoch": 18.493707539815123, "percentage": 92.47, "elapsed_time": "16:44:40", "remaining_time": "1:21:49", "throughput": 3349.75, "total_tokens": 201924400} +{"current_steps": 166060, "total_steps": 179580, "loss": 0.7103, "lr": 8.58469970924572e-07, "epoch": 18.494264394698742, "percentage": 92.47, "elapsed_time": "16:44:42", "remaining_time": "1:21:47", "throughput": 3349.75, "total_tokens": 201930640} +{"current_steps": 166065, "total_steps": 179580, "loss": 0.6762, "lr": 8.578388278207311e-07, "epoch": 18.49482124958236, "percentage": 92.47, "elapsed_time": "16:44:44", "remaining_time": "1:21:46", "throughput": 3349.76, "total_tokens": 201936752} +{"current_steps": 166070, "total_steps": 179580, "loss": 0.66, "lr": 8.572079127589449e-07, "epoch": 18.495378104465978, "percentage": 92.48, "elapsed_time": "16:44:45", "remaining_time": "1:21:44", "throughput": 3349.76, "total_tokens": 201942224} +{"current_steps": 166075, "total_steps": 179580, "loss": 0.7978, "lr": 8.565772257451699e-07, "epoch": 18.495934959349594, "percentage": 92.48, "elapsed_time": "16:44:47", "remaining_time": "1:21:42", "throughput": 3349.76, "total_tokens": 201948592} +{"current_steps": 166080, "total_steps": 179580, "loss": 0.9568, "lr": 8.559467667853705e-07, "epoch": 18.49649181423321, "percentage": 92.48, "elapsed_time": "16:44:49", "remaining_time": "1:21:40", "throughput": 3349.76, "total_tokens": 201954640} +{"current_steps": 166085, "total_steps": 179580, "loss": 0.6251, "lr": 8.553165358854947e-07, "epoch": 18.49704866911683, "percentage": 92.49, "elapsed_time": "16:44:50", "remaining_time": "1:21:38", "throughput": 3349.77, "total_tokens": 201960656} +{"current_steps": 166090, "total_steps": 179580, "loss": 0.6627, "lr": 8.546865330515019e-07, "epoch": 18.497605524000445, "percentage": 92.49, "elapsed_time": "16:44:52", "remaining_time": "1:21:37", "throughput": 3349.77, "total_tokens": 201966416} +{"current_steps": 166095, "total_steps": 179580, "loss": 0.727, "lr": 8.540567582893372e-07, "epoch": 18.498162378884064, "percentage": 92.49, "elapsed_time": "16:44:54", "remaining_time": "1:21:35", "throughput": 3349.77, "total_tokens": 201972496} +{"current_steps": 166100, "total_steps": 179580, "loss": 0.5124, "lr": 8.534272116049513e-07, "epoch": 18.49871923376768, "percentage": 92.49, "elapsed_time": "16:44:56", "remaining_time": "1:21:33", "throughput": 3349.78, "total_tokens": 201978416} +{"current_steps": 166105, "total_steps": 179580, "loss": 0.472, "lr": 8.527978930042923e-07, "epoch": 18.499276088651296, "percentage": 92.5, "elapsed_time": "16:44:57", "remaining_time": "1:21:31", "throughput": 3349.78, "total_tokens": 201984880} +{"current_steps": 166110, "total_steps": 179580, "loss": 0.5182, "lr": 8.521688024933028e-07, "epoch": 18.499832943534916, "percentage": 92.5, "elapsed_time": "16:44:59", "remaining_time": "1:21:29", "throughput": 3349.78, "total_tokens": 201990960} +{"current_steps": 166115, "total_steps": 179580, "loss": 0.7264, "lr": 8.515399400779278e-07, "epoch": 18.50038979841853, "percentage": 92.5, "elapsed_time": "16:45:01", "remaining_time": "1:21:27", "throughput": 3349.79, "total_tokens": 201997264} +{"current_steps": 166120, "total_steps": 179580, "loss": 0.7209, "lr": 8.509113057641072e-07, "epoch": 18.50094665330215, "percentage": 92.5, "elapsed_time": "16:45:03", "remaining_time": "1:21:26", "throughput": 3349.79, "total_tokens": 202003440} +{"current_steps": 166125, "total_steps": 179580, "loss": 0.9238, "lr": 8.502828995577722e-07, "epoch": 18.501503508185767, "percentage": 92.51, "elapsed_time": "16:45:05", "remaining_time": "1:21:24", "throughput": 3349.79, "total_tokens": 202009584} +{"current_steps": 166130, "total_steps": 179580, "loss": 0.6253, "lr": 8.496547214648654e-07, "epoch": 18.502060363069383, "percentage": 92.51, "elapsed_time": "16:45:06", "remaining_time": "1:21:22", "throughput": 3349.8, "total_tokens": 202015728} +{"current_steps": 166135, "total_steps": 179580, "loss": 0.6452, "lr": 8.490267714913208e-07, "epoch": 18.502617217953002, "percentage": 92.51, "elapsed_time": "16:45:08", "remaining_time": "1:21:20", "throughput": 3349.8, "total_tokens": 202021968} +{"current_steps": 166140, "total_steps": 179580, "loss": 0.6432, "lr": 8.483990496430671e-07, "epoch": 18.503174072836618, "percentage": 92.52, "elapsed_time": "16:45:10", "remaining_time": "1:21:18", "throughput": 3349.81, "total_tokens": 202028208} +{"current_steps": 166145, "total_steps": 179580, "loss": 0.745, "lr": 8.477715559260302e-07, "epoch": 18.503730927720238, "percentage": 92.52, "elapsed_time": "16:45:12", "remaining_time": "1:21:17", "throughput": 3349.81, "total_tokens": 202033968} +{"current_steps": 166150, "total_steps": 179580, "loss": 0.8252, "lr": 8.471442903461468e-07, "epoch": 18.504287782603853, "percentage": 92.52, "elapsed_time": "16:45:13", "remaining_time": "1:21:15", "throughput": 3349.81, "total_tokens": 202040272} +{"current_steps": 166155, "total_steps": 179580, "loss": 0.9906, "lr": 8.465172529093318e-07, "epoch": 18.50484463748747, "percentage": 92.52, "elapsed_time": "16:45:15", "remaining_time": "1:21:13", "throughput": 3349.82, "total_tokens": 202046608} +{"current_steps": 166160, "total_steps": 179580, "loss": 0.8481, "lr": 8.458904436215164e-07, "epoch": 18.50540149237109, "percentage": 92.53, "elapsed_time": "16:45:17", "remaining_time": "1:21:11", "throughput": 3349.82, "total_tokens": 202052912} +{"current_steps": 166165, "total_steps": 179580, "loss": 0.606, "lr": 8.452638624886183e-07, "epoch": 18.505958347254705, "percentage": 92.53, "elapsed_time": "16:45:19", "remaining_time": "1:21:09", "throughput": 3349.83, "total_tokens": 202059280} +{"current_steps": 166170, "total_steps": 179580, "loss": 0.6042, "lr": 8.446375095165548e-07, "epoch": 18.506515202138324, "percentage": 92.53, "elapsed_time": "16:45:21", "remaining_time": "1:21:07", "throughput": 3349.83, "total_tokens": 202065616} +{"current_steps": 166175, "total_steps": 179580, "loss": 0.8633, "lr": 8.44011384711238e-07, "epoch": 18.50707205702194, "percentage": 92.54, "elapsed_time": "16:45:22", "remaining_time": "1:21:06", "throughput": 3349.84, "total_tokens": 202071856} +{"current_steps": 166180, "total_steps": 179580, "loss": 0.6966, "lr": 8.433854880785936e-07, "epoch": 18.507628911905556, "percentage": 92.54, "elapsed_time": "16:45:24", "remaining_time": "1:21:04", "throughput": 3349.84, "total_tokens": 202077840} +{"current_steps": 166185, "total_steps": 179580, "loss": 0.6501, "lr": 8.427598196245251e-07, "epoch": 18.508185766789175, "percentage": 92.54, "elapsed_time": "16:45:26", "remaining_time": "1:21:02", "throughput": 3349.84, "total_tokens": 202084144} +{"current_steps": 166190, "total_steps": 179580, "loss": 0.5917, "lr": 8.421343793549446e-07, "epoch": 18.50874262167279, "percentage": 92.54, "elapsed_time": "16:45:28", "remaining_time": "1:21:00", "throughput": 3349.85, "total_tokens": 202090672} +{"current_steps": 166195, "total_steps": 179580, "loss": 0.7346, "lr": 8.415091672757613e-07, "epoch": 18.50929947655641, "percentage": 92.55, "elapsed_time": "16:45:30", "remaining_time": "1:20:58", "throughput": 3349.85, "total_tokens": 202096816} +{"current_steps": 166200, "total_steps": 179580, "loss": 0.491, "lr": 8.40884183392876e-07, "epoch": 18.509856331440027, "percentage": 92.55, "elapsed_time": "16:45:31", "remaining_time": "1:20:57", "throughput": 3349.85, "total_tokens": 202102768} +{"current_steps": 166205, "total_steps": 179580, "loss": 0.6144, "lr": 8.402594277121978e-07, "epoch": 18.510413186323643, "percentage": 92.55, "elapsed_time": "16:45:33", "remaining_time": "1:20:55", "throughput": 3349.85, "total_tokens": 202108816} +{"current_steps": 166210, "total_steps": 179580, "loss": 0.6896, "lr": 8.396349002396247e-07, "epoch": 18.510970041207262, "percentage": 92.55, "elapsed_time": "16:45:35", "remaining_time": "1:20:53", "throughput": 3349.86, "total_tokens": 202115120} +{"current_steps": 166215, "total_steps": 179580, "loss": 0.7813, "lr": 8.390106009810578e-07, "epoch": 18.511526896090878, "percentage": 92.56, "elapsed_time": "16:45:37", "remaining_time": "1:20:51", "throughput": 3349.86, "total_tokens": 202121808} +{"current_steps": 166220, "total_steps": 179580, "loss": 0.4116, "lr": 8.383865299423921e-07, "epoch": 18.512083750974497, "percentage": 92.56, "elapsed_time": "16:45:39", "remaining_time": "1:20:49", "throughput": 3349.87, "total_tokens": 202127952} +{"current_steps": 166225, "total_steps": 179580, "loss": 0.7802, "lr": 8.37762687129523e-07, "epoch": 18.512640605858113, "percentage": 92.56, "elapsed_time": "16:45:40", "remaining_time": "1:20:47", "throughput": 3349.86, "total_tokens": 202134064} +{"current_steps": 166230, "total_steps": 179580, "loss": 0.8791, "lr": 8.37139072548343e-07, "epoch": 18.51319746074173, "percentage": 92.57, "elapsed_time": "16:45:42", "remaining_time": "1:20:46", "throughput": 3349.86, "total_tokens": 202140240} +{"current_steps": 166235, "total_steps": 179580, "loss": 0.7289, "lr": 8.365156862047502e-07, "epoch": 18.51375431562535, "percentage": 92.57, "elapsed_time": "16:45:44", "remaining_time": "1:20:44", "throughput": 3349.87, "total_tokens": 202146096} +{"current_steps": 166240, "total_steps": 179580, "loss": 0.5093, "lr": 8.358925281046203e-07, "epoch": 18.514311170508964, "percentage": 92.57, "elapsed_time": "16:45:46", "remaining_time": "1:20:42", "throughput": 3349.87, "total_tokens": 202151952} +{"current_steps": 166245, "total_steps": 179580, "loss": 0.87, "lr": 8.35269598253846e-07, "epoch": 18.514868025392584, "percentage": 92.57, "elapsed_time": "16:45:47", "remaining_time": "1:20:40", "throughput": 3349.87, "total_tokens": 202157936} +{"current_steps": 166250, "total_steps": 179580, "loss": 0.578, "lr": 8.346468966583087e-07, "epoch": 18.5154248802762, "percentage": 92.58, "elapsed_time": "16:45:49", "remaining_time": "1:20:38", "throughput": 3349.87, "total_tokens": 202163920} +{"current_steps": 166255, "total_steps": 179580, "loss": 0.7492, "lr": 8.34024423323898e-07, "epoch": 18.515981735159816, "percentage": 92.58, "elapsed_time": "16:45:51", "remaining_time": "1:20:37", "throughput": 3349.87, "total_tokens": 202169296} +{"current_steps": 166260, "total_steps": 179580, "loss": 0.8346, "lr": 8.334021782564843e-07, "epoch": 18.516538590043435, "percentage": 92.58, "elapsed_time": "16:45:53", "remaining_time": "1:20:35", "throughput": 3349.88, "total_tokens": 202175888} +{"current_steps": 166265, "total_steps": 179580, "loss": 0.613, "lr": 8.327801614619518e-07, "epoch": 18.51709544492705, "percentage": 92.59, "elapsed_time": "16:45:54", "remaining_time": "1:20:33", "throughput": 3349.88, "total_tokens": 202181744} +{"current_steps": 166270, "total_steps": 179580, "loss": 0.5808, "lr": 8.321583729461679e-07, "epoch": 18.51765229981067, "percentage": 92.59, "elapsed_time": "16:45:56", "remaining_time": "1:20:31", "throughput": 3349.89, "total_tokens": 202187984} +{"current_steps": 166275, "total_steps": 179580, "loss": 0.6431, "lr": 8.31536812715017e-07, "epoch": 18.518209154694286, "percentage": 92.59, "elapsed_time": "16:45:58", "remaining_time": "1:20:29", "throughput": 3349.89, "total_tokens": 202194128} +{"current_steps": 166280, "total_steps": 179580, "loss": 0.7836, "lr": 8.309154807743608e-07, "epoch": 18.518766009577902, "percentage": 92.59, "elapsed_time": "16:46:00", "remaining_time": "1:20:27", "throughput": 3349.89, "total_tokens": 202199984} +{"current_steps": 166285, "total_steps": 179580, "loss": 0.7487, "lr": 8.302943771300753e-07, "epoch": 18.51932286446152, "percentage": 92.6, "elapsed_time": "16:46:01", "remaining_time": "1:20:26", "throughput": 3349.9, "total_tokens": 202205872} +{"current_steps": 166290, "total_steps": 179580, "loss": 0.5888, "lr": 8.296735017880197e-07, "epoch": 18.519879719345138, "percentage": 92.6, "elapsed_time": "16:46:03", "remaining_time": "1:20:24", "throughput": 3349.9, "total_tokens": 202212176} +{"current_steps": 166295, "total_steps": 179580, "loss": 0.7998, "lr": 8.290528547540643e-07, "epoch": 18.520436574228757, "percentage": 92.6, "elapsed_time": "16:46:05", "remaining_time": "1:20:22", "throughput": 3349.9, "total_tokens": 202218256} +{"current_steps": 166300, "total_steps": 179580, "loss": 0.7154, "lr": 8.284324360340684e-07, "epoch": 18.520993429112373, "percentage": 92.6, "elapsed_time": "16:46:07", "remaining_time": "1:20:20", "throughput": 3349.9, "total_tokens": 202224112} +{"current_steps": 166305, "total_steps": 179580, "loss": 0.666, "lr": 8.278122456338993e-07, "epoch": 18.521550283995992, "percentage": 92.61, "elapsed_time": "16:46:08", "remaining_time": "1:20:18", "throughput": 3349.91, "total_tokens": 202230384} +{"current_steps": 166310, "total_steps": 179580, "loss": 0.6842, "lr": 8.271922835594054e-07, "epoch": 18.52210713887961, "percentage": 92.61, "elapsed_time": "16:46:10", "remaining_time": "1:20:17", "throughput": 3349.91, "total_tokens": 202236496} +{"current_steps": 166315, "total_steps": 179580, "loss": 0.6615, "lr": 8.265725498164484e-07, "epoch": 18.522663993763224, "percentage": 92.61, "elapsed_time": "16:46:12", "remaining_time": "1:20:15", "throughput": 3349.92, "total_tokens": 202242768} +{"current_steps": 166320, "total_steps": 179580, "loss": 0.4751, "lr": 8.259530444108793e-07, "epoch": 18.523220848646844, "percentage": 92.62, "elapsed_time": "16:46:14", "remaining_time": "1:20:13", "throughput": 3349.92, "total_tokens": 202249040} +{"current_steps": 166325, "total_steps": 179580, "loss": 1.0801, "lr": 8.253337673485545e-07, "epoch": 18.52377770353046, "percentage": 92.62, "elapsed_time": "16:46:16", "remaining_time": "1:20:11", "throughput": 3349.93, "total_tokens": 202255088} +{"current_steps": 166330, "total_steps": 179580, "loss": 0.6927, "lr": 8.247147186353193e-07, "epoch": 18.524334558414076, "percentage": 92.62, "elapsed_time": "16:46:17", "remaining_time": "1:20:09", "throughput": 3349.93, "total_tokens": 202261392} +{"current_steps": 166335, "total_steps": 179580, "loss": 0.853, "lr": 8.240958982770247e-07, "epoch": 18.524891413297695, "percentage": 92.62, "elapsed_time": "16:46:19", "remaining_time": "1:20:07", "throughput": 3349.93, "total_tokens": 202267536} +{"current_steps": 166340, "total_steps": 179580, "loss": 0.8515, "lr": 8.234773062795104e-07, "epoch": 18.52544826818131, "percentage": 92.63, "elapsed_time": "16:46:21", "remaining_time": "1:20:06", "throughput": 3349.94, "total_tokens": 202273872} +{"current_steps": 166345, "total_steps": 179580, "loss": 0.6588, "lr": 8.228589426486244e-07, "epoch": 18.52600512306493, "percentage": 92.63, "elapsed_time": "16:46:23", "remaining_time": "1:20:04", "throughput": 3349.94, "total_tokens": 202279472} +{"current_steps": 166350, "total_steps": 179580, "loss": 0.7494, "lr": 8.222408073902066e-07, "epoch": 18.526561977948546, "percentage": 92.63, "elapsed_time": "16:46:24", "remaining_time": "1:20:02", "throughput": 3349.94, "total_tokens": 202285744} +{"current_steps": 166355, "total_steps": 179580, "loss": 0.6443, "lr": 8.216229005100967e-07, "epoch": 18.527118832832166, "percentage": 92.64, "elapsed_time": "16:46:26", "remaining_time": "1:20:00", "throughput": 3349.95, "total_tokens": 202291632} +{"current_steps": 166360, "total_steps": 179580, "loss": 0.7946, "lr": 8.210052220141262e-07, "epoch": 18.52767568771578, "percentage": 92.64, "elapsed_time": "16:46:28", "remaining_time": "1:19:58", "throughput": 3349.95, "total_tokens": 202297840} +{"current_steps": 166365, "total_steps": 179580, "loss": 0.5913, "lr": 8.203877719081349e-07, "epoch": 18.528232542599397, "percentage": 92.64, "elapsed_time": "16:46:30", "remaining_time": "1:19:57", "throughput": 3349.95, "total_tokens": 202303856} +{"current_steps": 166370, "total_steps": 179580, "loss": 0.6588, "lr": 8.197705501979514e-07, "epoch": 18.528789397483017, "percentage": 92.64, "elapsed_time": "16:46:31", "remaining_time": "1:19:55", "throughput": 3349.96, "total_tokens": 202309840} +{"current_steps": 166375, "total_steps": 179580, "loss": 0.7928, "lr": 8.191535568894127e-07, "epoch": 18.529346252366633, "percentage": 92.65, "elapsed_time": "16:46:33", "remaining_time": "1:19:53", "throughput": 3349.96, "total_tokens": 202315856} +{"current_steps": 166380, "total_steps": 179580, "loss": 0.7455, "lr": 8.185367919883391e-07, "epoch": 18.529903107250252, "percentage": 92.65, "elapsed_time": "16:46:35", "remaining_time": "1:19:51", "throughput": 3349.96, "total_tokens": 202322032} +{"current_steps": 166385, "total_steps": 179580, "loss": 0.527, "lr": 8.179202555005622e-07, "epoch": 18.530459962133868, "percentage": 92.65, "elapsed_time": "16:46:37", "remaining_time": "1:19:49", "throughput": 3349.97, "total_tokens": 202328272} +{"current_steps": 166390, "total_steps": 179580, "loss": 0.9677, "lr": 8.173039474318966e-07, "epoch": 18.531016817017484, "percentage": 92.66, "elapsed_time": "16:46:38", "remaining_time": "1:19:47", "throughput": 3349.97, "total_tokens": 202334096} +{"current_steps": 166395, "total_steps": 179580, "loss": 0.8108, "lr": 8.166878677881767e-07, "epoch": 18.531573671901103, "percentage": 92.66, "elapsed_time": "16:46:40", "remaining_time": "1:19:46", "throughput": 3349.97, "total_tokens": 202340048} +{"current_steps": 166400, "total_steps": 179580, "loss": 0.8704, "lr": 8.160720165752117e-07, "epoch": 18.53213052678472, "percentage": 92.66, "elapsed_time": "16:46:42", "remaining_time": "1:19:44", "throughput": 3349.97, "total_tokens": 202346160} +{"current_steps": 166405, "total_steps": 179580, "loss": 0.6899, "lr": 8.154563937988247e-07, "epoch": 18.53268738166834, "percentage": 92.66, "elapsed_time": "16:46:44", "remaining_time": "1:19:42", "throughput": 3349.98, "total_tokens": 202352176} +{"current_steps": 166410, "total_steps": 179580, "loss": 0.6181, "lr": 8.148409994648249e-07, "epoch": 18.533244236551955, "percentage": 92.67, "elapsed_time": "16:46:45", "remaining_time": "1:19:40", "throughput": 3349.98, "total_tokens": 202358032} +{"current_steps": 166415, "total_steps": 179580, "loss": 0.7628, "lr": 8.142258335790298e-07, "epoch": 18.53380109143557, "percentage": 92.67, "elapsed_time": "16:46:47", "remaining_time": "1:19:38", "throughput": 3349.98, "total_tokens": 202364432} +{"current_steps": 166420, "total_steps": 179580, "loss": 0.6363, "lr": 8.136108961472488e-07, "epoch": 18.53435794631919, "percentage": 92.67, "elapsed_time": "16:46:49", "remaining_time": "1:19:36", "throughput": 3349.99, "total_tokens": 202370416} +{"current_steps": 166425, "total_steps": 179580, "loss": 0.6624, "lr": 8.129961871752939e-07, "epoch": 18.534914801202806, "percentage": 92.67, "elapsed_time": "16:46:51", "remaining_time": "1:19:35", "throughput": 3349.99, "total_tokens": 202376464} +{"current_steps": 166430, "total_steps": 179580, "loss": 0.7288, "lr": 8.123817066689659e-07, "epoch": 18.535471656086425, "percentage": 92.68, "elapsed_time": "16:46:52", "remaining_time": "1:19:33", "throughput": 3349.99, "total_tokens": 202382480} +{"current_steps": 166435, "total_steps": 179580, "loss": 0.6897, "lr": 8.117674546340714e-07, "epoch": 18.53602851097004, "percentage": 92.68, "elapsed_time": "16:46:54", "remaining_time": "1:19:31", "throughput": 3350.0, "total_tokens": 202388656} +{"current_steps": 166440, "total_steps": 179580, "loss": 0.6167, "lr": 8.111534310764113e-07, "epoch": 18.536585365853657, "percentage": 92.68, "elapsed_time": "16:46:56", "remaining_time": "1:19:29", "throughput": 3350.0, "total_tokens": 202395120} +{"current_steps": 166445, "total_steps": 179580, "loss": 0.8036, "lr": 8.105396360017892e-07, "epoch": 18.537142220737277, "percentage": 92.69, "elapsed_time": "16:46:58", "remaining_time": "1:19:27", "throughput": 3350.0, "total_tokens": 202400944} +{"current_steps": 166450, "total_steps": 179580, "loss": 0.8693, "lr": 8.099260694160004e-07, "epoch": 18.537699075620893, "percentage": 92.69, "elapsed_time": "16:46:59", "remaining_time": "1:19:26", "throughput": 3350.01, "total_tokens": 202407120} +{"current_steps": 166455, "total_steps": 179580, "loss": 0.6714, "lr": 8.093127313248406e-07, "epoch": 18.538255930504512, "percentage": 92.69, "elapsed_time": "16:47:01", "remaining_time": "1:19:24", "throughput": 3350.01, "total_tokens": 202413072} +{"current_steps": 166460, "total_steps": 179580, "loss": 1.1385, "lr": 8.086996217341019e-07, "epoch": 18.538812785388128, "percentage": 92.69, "elapsed_time": "16:47:03", "remaining_time": "1:19:22", "throughput": 3350.01, "total_tokens": 202419056} +{"current_steps": 166465, "total_steps": 179580, "loss": 0.5752, "lr": 8.080867406495773e-07, "epoch": 18.539369640271744, "percentage": 92.7, "elapsed_time": "16:47:05", "remaining_time": "1:19:20", "throughput": 3350.02, "total_tokens": 202425200} +{"current_steps": 166470, "total_steps": 179580, "loss": 0.9999, "lr": 8.074740880770565e-07, "epoch": 18.539926495155363, "percentage": 92.7, "elapsed_time": "16:47:06", "remaining_time": "1:19:18", "throughput": 3350.02, "total_tokens": 202431024} +{"current_steps": 166475, "total_steps": 179580, "loss": 0.8323, "lr": 8.068616640223264e-07, "epoch": 18.54048335003898, "percentage": 92.7, "elapsed_time": "16:47:08", "remaining_time": "1:19:16", "throughput": 3350.02, "total_tokens": 202437040} +{"current_steps": 166480, "total_steps": 179580, "loss": 0.8934, "lr": 8.062494684911687e-07, "epoch": 18.5410402049226, "percentage": 92.71, "elapsed_time": "16:47:10", "remaining_time": "1:19:15", "throughput": 3350.02, "total_tokens": 202442640} +{"current_steps": 166485, "total_steps": 179580, "loss": 0.5388, "lr": 8.056375014893703e-07, "epoch": 18.541597059806215, "percentage": 92.71, "elapsed_time": "16:47:12", "remaining_time": "1:19:13", "throughput": 3350.03, "total_tokens": 202448848} +{"current_steps": 166490, "total_steps": 179580, "loss": 0.6945, "lr": 8.05025763022707e-07, "epoch": 18.54215391468983, "percentage": 92.71, "elapsed_time": "16:47:13", "remaining_time": "1:19:11", "throughput": 3350.03, "total_tokens": 202455152} +{"current_steps": 166495, "total_steps": 179580, "loss": 0.9772, "lr": 8.044142530969661e-07, "epoch": 18.54271076957345, "percentage": 92.71, "elapsed_time": "16:47:15", "remaining_time": "1:19:09", "throughput": 3350.03, "total_tokens": 202461264} +{"current_steps": 166500, "total_steps": 179580, "loss": 0.7073, "lr": 8.038029717179124e-07, "epoch": 18.543267624457066, "percentage": 92.72, "elapsed_time": "16:47:17", "remaining_time": "1:19:07", "throughput": 3350.04, "total_tokens": 202467280} +{"current_steps": 166505, "total_steps": 179580, "loss": 0.6336, "lr": 8.031919188913273e-07, "epoch": 18.543824479340685, "percentage": 92.72, "elapsed_time": "16:47:19", "remaining_time": "1:19:06", "throughput": 3350.04, "total_tokens": 202473392} +{"current_steps": 166510, "total_steps": 179580, "loss": 0.8507, "lr": 8.025810946229784e-07, "epoch": 18.5443813342243, "percentage": 92.72, "elapsed_time": "16:47:20", "remaining_time": "1:19:04", "throughput": 3350.04, "total_tokens": 202479568} +{"current_steps": 166515, "total_steps": 179580, "loss": 0.8711, "lr": 8.019704989186416e-07, "epoch": 18.544938189107917, "percentage": 92.72, "elapsed_time": "16:47:22", "remaining_time": "1:19:02", "throughput": 3350.05, "total_tokens": 202485552} +{"current_steps": 166520, "total_steps": 179580, "loss": 0.7623, "lr": 8.013601317840791e-07, "epoch": 18.545495043991536, "percentage": 92.73, "elapsed_time": "16:47:24", "remaining_time": "1:19:00", "throughput": 3350.05, "total_tokens": 202491824} +{"current_steps": 166525, "total_steps": 179580, "loss": 0.7854, "lr": 8.007499932250583e-07, "epoch": 18.546051898875152, "percentage": 92.73, "elapsed_time": "16:47:26", "remaining_time": "1:18:58", "throughput": 3350.05, "total_tokens": 202497808} +{"current_steps": 166530, "total_steps": 179580, "loss": 0.7583, "lr": 8.001400832473388e-07, "epoch": 18.546608753758772, "percentage": 92.73, "elapsed_time": "16:47:27", "remaining_time": "1:18:56", "throughput": 3350.06, "total_tokens": 202503696} +{"current_steps": 166535, "total_steps": 179580, "loss": 0.5567, "lr": 7.995304018566879e-07, "epoch": 18.547165608642388, "percentage": 92.74, "elapsed_time": "16:47:29", "remaining_time": "1:18:55", "throughput": 3350.06, "total_tokens": 202510032} +{"current_steps": 166540, "total_steps": 179580, "loss": 0.6668, "lr": 7.989209490588595e-07, "epoch": 18.547722463526004, "percentage": 92.74, "elapsed_time": "16:47:31", "remaining_time": "1:18:53", "throughput": 3350.07, "total_tokens": 202516112} +{"current_steps": 166545, "total_steps": 179580, "loss": 0.6433, "lr": 7.983117248596156e-07, "epoch": 18.548279318409623, "percentage": 92.74, "elapsed_time": "16:47:33", "remaining_time": "1:18:51", "throughput": 3350.07, "total_tokens": 202522224} +{"current_steps": 166550, "total_steps": 179580, "loss": 0.7503, "lr": 7.977027292647016e-07, "epoch": 18.54883617329324, "percentage": 92.74, "elapsed_time": "16:47:35", "remaining_time": "1:18:49", "throughput": 3350.07, "total_tokens": 202528752} +{"current_steps": 166555, "total_steps": 179580, "loss": 0.795, "lr": 7.970939622798823e-07, "epoch": 18.54939302817686, "percentage": 92.75, "elapsed_time": "16:47:36", "remaining_time": "1:18:47", "throughput": 3350.08, "total_tokens": 202534736} +{"current_steps": 166560, "total_steps": 179580, "loss": 0.7147, "lr": 7.964854239108949e-07, "epoch": 18.549949883060474, "percentage": 92.75, "elapsed_time": "16:47:38", "remaining_time": "1:18:46", "throughput": 3350.08, "total_tokens": 202540944} +{"current_steps": 166565, "total_steps": 179580, "loss": 0.5732, "lr": 7.958771141635013e-07, "epoch": 18.55050673794409, "percentage": 92.75, "elapsed_time": "16:47:40", "remaining_time": "1:18:44", "throughput": 3350.08, "total_tokens": 202546768} +{"current_steps": 166570, "total_steps": 179580, "loss": 0.6308, "lr": 7.952690330434359e-07, "epoch": 18.55106359282771, "percentage": 92.76, "elapsed_time": "16:47:41", "remaining_time": "1:18:42", "throughput": 3350.08, "total_tokens": 202552592} +{"current_steps": 166575, "total_steps": 179580, "loss": 0.9554, "lr": 7.946611805564497e-07, "epoch": 18.551620447711326, "percentage": 92.76, "elapsed_time": "16:47:43", "remaining_time": "1:18:40", "throughput": 3350.09, "total_tokens": 202558512} +{"current_steps": 166580, "total_steps": 179580, "loss": 0.7035, "lr": 7.940535567082797e-07, "epoch": 18.552177302594945, "percentage": 92.76, "elapsed_time": "16:47:45", "remaining_time": "1:18:38", "throughput": 3350.09, "total_tokens": 202564688} +{"current_steps": 166585, "total_steps": 179580, "loss": 0.7241, "lr": 7.934461615046684e-07, "epoch": 18.55273415747856, "percentage": 92.76, "elapsed_time": "16:47:47", "remaining_time": "1:18:36", "throughput": 3350.09, "total_tokens": 202570960} +{"current_steps": 166590, "total_steps": 179580, "loss": 0.5588, "lr": 7.928389949513504e-07, "epoch": 18.553291012362177, "percentage": 92.77, "elapsed_time": "16:47:49", "remaining_time": "1:18:35", "throughput": 3350.1, "total_tokens": 202577232} +{"current_steps": 166595, "total_steps": 179580, "loss": 0.8335, "lr": 7.922320570540653e-07, "epoch": 18.553847867245796, "percentage": 92.77, "elapsed_time": "16:47:50", "remaining_time": "1:18:33", "throughput": 3350.1, "total_tokens": 202583568} +{"current_steps": 166600, "total_steps": 179580, "loss": 0.8439, "lr": 7.91625347818542e-07, "epoch": 18.554404722129412, "percentage": 92.77, "elapsed_time": "16:47:52", "remaining_time": "1:18:31", "throughput": 3350.11, "total_tokens": 202589808} +{"current_steps": 166605, "total_steps": 179580, "loss": 0.6194, "lr": 7.91018867250512e-07, "epoch": 18.55496157701303, "percentage": 92.77, "elapsed_time": "16:47:54", "remaining_time": "1:18:29", "throughput": 3350.11, "total_tokens": 202595728} +{"current_steps": 166610, "total_steps": 179580, "loss": 0.8645, "lr": 7.90412615355704e-07, "epoch": 18.555518431896648, "percentage": 92.78, "elapsed_time": "16:47:56", "remaining_time": "1:18:27", "throughput": 3350.11, "total_tokens": 202601648} +{"current_steps": 166615, "total_steps": 179580, "loss": 0.7495, "lr": 7.898065921398495e-07, "epoch": 18.556075286780263, "percentage": 92.78, "elapsed_time": "16:47:57", "remaining_time": "1:18:26", "throughput": 3350.12, "total_tokens": 202607856} +{"current_steps": 166620, "total_steps": 179580, "loss": 0.9422, "lr": 7.892007976086663e-07, "epoch": 18.556632141663883, "percentage": 92.78, "elapsed_time": "16:47:59", "remaining_time": "1:18:24", "throughput": 3350.12, "total_tokens": 202614096} +{"current_steps": 166625, "total_steps": 179580, "loss": 0.8173, "lr": 7.885952317678747e-07, "epoch": 18.5571889965475, "percentage": 92.79, "elapsed_time": "16:48:01", "remaining_time": "1:18:22", "throughput": 3350.12, "total_tokens": 202620240} +{"current_steps": 166630, "total_steps": 179580, "loss": 0.7662, "lr": 7.879898946232034e-07, "epoch": 18.557745851431118, "percentage": 92.79, "elapsed_time": "16:48:03", "remaining_time": "1:18:20", "throughput": 3350.13, "total_tokens": 202626704} +{"current_steps": 166635, "total_steps": 179580, "loss": 0.629, "lr": 7.873847861803646e-07, "epoch": 18.558302706314734, "percentage": 92.79, "elapsed_time": "16:48:05", "remaining_time": "1:18:18", "throughput": 3350.13, "total_tokens": 202632528} +{"current_steps": 166640, "total_steps": 179580, "loss": 0.6763, "lr": 7.867799064450787e-07, "epoch": 18.55885956119835, "percentage": 92.79, "elapsed_time": "16:48:06", "remaining_time": "1:18:16", "throughput": 3350.13, "total_tokens": 202638576} +{"current_steps": 166645, "total_steps": 179580, "loss": 0.5533, "lr": 7.861752554230494e-07, "epoch": 18.55941641608197, "percentage": 92.8, "elapsed_time": "16:48:08", "remaining_time": "1:18:15", "throughput": 3350.13, "total_tokens": 202644976} +{"current_steps": 166650, "total_steps": 179580, "loss": 0.6674, "lr": 7.855708331200001e-07, "epoch": 18.559973270965585, "percentage": 92.8, "elapsed_time": "16:48:10", "remaining_time": "1:18:13", "throughput": 3350.14, "total_tokens": 202651728} +{"current_steps": 166655, "total_steps": 179580, "loss": 0.6808, "lr": 7.849666395416289e-07, "epoch": 18.560530125849205, "percentage": 92.8, "elapsed_time": "16:48:12", "remaining_time": "1:18:11", "throughput": 3350.14, "total_tokens": 202658032} +{"current_steps": 166660, "total_steps": 179580, "loss": 0.6093, "lr": 7.843626746936534e-07, "epoch": 18.56108698073282, "percentage": 92.81, "elapsed_time": "16:48:14", "remaining_time": "1:18:09", "throughput": 3350.15, "total_tokens": 202664016} +{"current_steps": 166665, "total_steps": 179580, "loss": 0.7158, "lr": 7.837589385817746e-07, "epoch": 18.561643835616437, "percentage": 92.81, "elapsed_time": "16:48:15", "remaining_time": "1:18:07", "throughput": 3350.15, "total_tokens": 202669616} +{"current_steps": 166670, "total_steps": 179580, "loss": 0.7696, "lr": 7.831554312116934e-07, "epoch": 18.562200690500056, "percentage": 92.81, "elapsed_time": "16:48:17", "remaining_time": "1:18:06", "throughput": 3350.15, "total_tokens": 202675888} +{"current_steps": 166675, "total_steps": 179580, "loss": 0.4453, "lr": 7.825521525891083e-07, "epoch": 18.562757545383672, "percentage": 92.81, "elapsed_time": "16:48:19", "remaining_time": "1:18:04", "throughput": 3350.15, "total_tokens": 202682064} +{"current_steps": 166680, "total_steps": 179580, "loss": 0.4813, "lr": 7.819491027197228e-07, "epoch": 18.56331440026729, "percentage": 92.82, "elapsed_time": "16:48:21", "remaining_time": "1:18:02", "throughput": 3350.16, "total_tokens": 202688112} +{"current_steps": 166685, "total_steps": 179580, "loss": 0.7199, "lr": 7.813462816092326e-07, "epoch": 18.563871255150907, "percentage": 92.82, "elapsed_time": "16:48:22", "remaining_time": "1:18:00", "throughput": 3350.16, "total_tokens": 202694608} +{"current_steps": 166690, "total_steps": 179580, "loss": 0.7039, "lr": 7.807436892633274e-07, "epoch": 18.564428110034527, "percentage": 92.82, "elapsed_time": "16:48:24", "remaining_time": "1:17:58", "throughput": 3350.17, "total_tokens": 202700624} +{"current_steps": 166695, "total_steps": 179580, "loss": 0.6233, "lr": 7.801413256877027e-07, "epoch": 18.564984964918143, "percentage": 92.82, "elapsed_time": "16:48:26", "remaining_time": "1:17:56", "throughput": 3350.17, "total_tokens": 202706672} +{"current_steps": 166700, "total_steps": 179580, "loss": 0.9539, "lr": 7.795391908880511e-07, "epoch": 18.56554181980176, "percentage": 92.83, "elapsed_time": "16:48:28", "remaining_time": "1:17:55", "throughput": 3350.17, "total_tokens": 202712624} +{"current_steps": 166705, "total_steps": 179580, "loss": 0.7269, "lr": 7.789372848700516e-07, "epoch": 18.566098674685378, "percentage": 92.83, "elapsed_time": "16:48:29", "remaining_time": "1:17:53", "throughput": 3350.17, "total_tokens": 202718960} +{"current_steps": 166710, "total_steps": 179580, "loss": 0.4208, "lr": 7.783356076393994e-07, "epoch": 18.566655529568994, "percentage": 92.83, "elapsed_time": "16:48:31", "remaining_time": "1:17:51", "throughput": 3350.18, "total_tokens": 202724880} +{"current_steps": 166715, "total_steps": 179580, "loss": 0.9564, "lr": 7.777341592017734e-07, "epoch": 18.567212384452613, "percentage": 92.84, "elapsed_time": "16:48:33", "remaining_time": "1:17:49", "throughput": 3350.18, "total_tokens": 202730768} +{"current_steps": 166720, "total_steps": 179580, "loss": 0.7604, "lr": 7.771329395628524e-07, "epoch": 18.56776923933623, "percentage": 92.84, "elapsed_time": "16:48:35", "remaining_time": "1:17:47", "throughput": 3350.18, "total_tokens": 202737104} +{"current_steps": 166725, "total_steps": 179580, "loss": 0.6885, "lr": 7.76531948728318e-07, "epoch": 18.568326094219845, "percentage": 92.84, "elapsed_time": "16:48:36", "remaining_time": "1:17:46", "throughput": 3350.19, "total_tokens": 202743024} +{"current_steps": 166730, "total_steps": 179580, "loss": 0.7147, "lr": 7.759311867038488e-07, "epoch": 18.568882949103465, "percentage": 92.84, "elapsed_time": "16:48:38", "remaining_time": "1:17:44", "throughput": 3350.19, "total_tokens": 202749232} +{"current_steps": 166735, "total_steps": 179580, "loss": 0.6734, "lr": 7.753306534951182e-07, "epoch": 18.56943980398708, "percentage": 92.85, "elapsed_time": "16:48:40", "remaining_time": "1:17:42", "throughput": 3350.19, "total_tokens": 202755344} +{"current_steps": 166740, "total_steps": 179580, "loss": 0.6439, "lr": 7.747303491077967e-07, "epoch": 18.5699966588707, "percentage": 92.85, "elapsed_time": "16:48:42", "remaining_time": "1:17:40", "throughput": 3350.2, "total_tokens": 202761648} +{"current_steps": 166745, "total_steps": 179580, "loss": 0.5989, "lr": 7.741302735475548e-07, "epoch": 18.570553513754316, "percentage": 92.85, "elapsed_time": "16:48:44", "remaining_time": "1:17:38", "throughput": 3350.2, "total_tokens": 202768016} +{"current_steps": 166750, "total_steps": 179580, "loss": 0.6493, "lr": 7.735304268200627e-07, "epoch": 18.57111036863793, "percentage": 92.86, "elapsed_time": "16:48:45", "remaining_time": "1:17:36", "throughput": 3350.21, "total_tokens": 202774256} +{"current_steps": 166755, "total_steps": 179580, "loss": 0.788, "lr": 7.729308089309856e-07, "epoch": 18.57166722352155, "percentage": 92.86, "elapsed_time": "16:48:47", "remaining_time": "1:17:35", "throughput": 3350.21, "total_tokens": 202780016} +{"current_steps": 166760, "total_steps": 179580, "loss": 0.5489, "lr": 7.723314198859883e-07, "epoch": 18.572224078405167, "percentage": 92.86, "elapsed_time": "16:48:49", "remaining_time": "1:17:33", "throughput": 3350.21, "total_tokens": 202786000} +{"current_steps": 166765, "total_steps": 179580, "loss": 0.5431, "lr": 7.7173225969073e-07, "epoch": 18.572780933288787, "percentage": 92.86, "elapsed_time": "16:48:51", "remaining_time": "1:17:31", "throughput": 3350.22, "total_tokens": 202792048} +{"current_steps": 166770, "total_steps": 179580, "loss": 0.6291, "lr": 7.711333283508731e-07, "epoch": 18.573337788172402, "percentage": 92.87, "elapsed_time": "16:48:52", "remaining_time": "1:17:29", "throughput": 3350.22, "total_tokens": 202798064} +{"current_steps": 166775, "total_steps": 179580, "loss": 0.6335, "lr": 7.705346258720713e-07, "epoch": 18.57389464305602, "percentage": 92.87, "elapsed_time": "16:48:54", "remaining_time": "1:17:27", "throughput": 3350.22, "total_tokens": 202804208} +{"current_steps": 166780, "total_steps": 179580, "loss": 0.6711, "lr": 7.699361522599868e-07, "epoch": 18.574451497939638, "percentage": 92.87, "elapsed_time": "16:48:56", "remaining_time": "1:17:26", "throughput": 3350.22, "total_tokens": 202810288} +{"current_steps": 166785, "total_steps": 179580, "loss": 0.6794, "lr": 7.693379075202651e-07, "epoch": 18.575008352823254, "percentage": 92.88, "elapsed_time": "16:48:58", "remaining_time": "1:17:24", "throughput": 3350.23, "total_tokens": 202816304} +{"current_steps": 166790, "total_steps": 179580, "loss": 0.6997, "lr": 7.687398916585625e-07, "epoch": 18.575565207706873, "percentage": 92.88, "elapsed_time": "16:48:59", "remaining_time": "1:17:22", "throughput": 3350.23, "total_tokens": 202822640} +{"current_steps": 166795, "total_steps": 179580, "loss": 0.8699, "lr": 7.681421046805221e-07, "epoch": 18.57612206259049, "percentage": 92.88, "elapsed_time": "16:49:01", "remaining_time": "1:17:20", "throughput": 3350.23, "total_tokens": 202828816} +{"current_steps": 166800, "total_steps": 179580, "loss": 0.6982, "lr": 7.675445465917974e-07, "epoch": 18.576678917474105, "percentage": 92.88, "elapsed_time": "16:49:03", "remaining_time": "1:17:18", "throughput": 3350.24, "total_tokens": 202834832} +{"current_steps": 166805, "total_steps": 179580, "loss": 0.9936, "lr": 7.669472173980257e-07, "epoch": 18.577235772357724, "percentage": 92.89, "elapsed_time": "16:49:05", "remaining_time": "1:17:16", "throughput": 3350.24, "total_tokens": 202841008} +{"current_steps": 166810, "total_steps": 179580, "loss": 0.8922, "lr": 7.663501171048554e-07, "epoch": 18.57779262724134, "percentage": 92.89, "elapsed_time": "16:49:07", "remaining_time": "1:17:15", "throughput": 3350.24, "total_tokens": 202847472} +{"current_steps": 166815, "total_steps": 179580, "loss": 0.8613, "lr": 7.657532457179206e-07, "epoch": 18.57834948212496, "percentage": 92.89, "elapsed_time": "16:49:08", "remaining_time": "1:17:13", "throughput": 3350.25, "total_tokens": 202853264} +{"current_steps": 166820, "total_steps": 179580, "loss": 0.8194, "lr": 7.65156603242867e-07, "epoch": 18.578906337008576, "percentage": 92.89, "elapsed_time": "16:49:10", "remaining_time": "1:17:11", "throughput": 3350.25, "total_tokens": 202859152} +{"current_steps": 166825, "total_steps": 179580, "loss": 0.8101, "lr": 7.645601896853205e-07, "epoch": 18.57946319189219, "percentage": 92.9, "elapsed_time": "16:49:12", "remaining_time": "1:17:09", "throughput": 3350.25, "total_tokens": 202865136} +{"current_steps": 166830, "total_steps": 179580, "loss": 0.8779, "lr": 7.639640050509267e-07, "epoch": 18.58002004677581, "percentage": 92.9, "elapsed_time": "16:49:13", "remaining_time": "1:17:07", "throughput": 3350.26, "total_tokens": 202871280} +{"current_steps": 166835, "total_steps": 179580, "loss": 0.6596, "lr": 7.63368049345306e-07, "epoch": 18.580576901659427, "percentage": 92.9, "elapsed_time": "16:49:15", "remaining_time": "1:17:06", "throughput": 3350.26, "total_tokens": 202876912} +{"current_steps": 166840, "total_steps": 179580, "loss": 0.7715, "lr": 7.627723225740929e-07, "epoch": 18.581133756543046, "percentage": 92.91, "elapsed_time": "16:49:17", "remaining_time": "1:17:04", "throughput": 3350.26, "total_tokens": 202883088} +{"current_steps": 166845, "total_steps": 179580, "loss": 0.5971, "lr": 7.621768247429134e-07, "epoch": 18.581690611426662, "percentage": 92.91, "elapsed_time": "16:49:19", "remaining_time": "1:17:02", "throughput": 3350.27, "total_tokens": 202889008} +{"current_steps": 166850, "total_steps": 179580, "loss": 0.5065, "lr": 7.615815558573936e-07, "epoch": 18.582247466310278, "percentage": 92.91, "elapsed_time": "16:49:20", "remaining_time": "1:17:00", "throughput": 3350.27, "total_tokens": 202895280} +{"current_steps": 166855, "total_steps": 179580, "loss": 0.6904, "lr": 7.609865159231566e-07, "epoch": 18.582804321193898, "percentage": 92.91, "elapsed_time": "16:49:22", "remaining_time": "1:16:58", "throughput": 3350.27, "total_tokens": 202901424} +{"current_steps": 166860, "total_steps": 179580, "loss": 0.6449, "lr": 7.603917049458203e-07, "epoch": 18.583361176077513, "percentage": 92.92, "elapsed_time": "16:49:24", "remaining_time": "1:16:56", "throughput": 3350.28, "total_tokens": 202907280} +{"current_steps": 166865, "total_steps": 179580, "loss": 1.0599, "lr": 7.597971229310025e-07, "epoch": 18.583918030961133, "percentage": 92.92, "elapsed_time": "16:49:26", "remaining_time": "1:16:55", "throughput": 3350.28, "total_tokens": 202913232} +{"current_steps": 166870, "total_steps": 179580, "loss": 0.6832, "lr": 7.592027698843263e-07, "epoch": 18.58447488584475, "percentage": 92.92, "elapsed_time": "16:49:27", "remaining_time": "1:16:53", "throughput": 3350.28, "total_tokens": 202919568} +{"current_steps": 166875, "total_steps": 179580, "loss": 0.8461, "lr": 7.586086458114011e-07, "epoch": 18.585031740728365, "percentage": 92.93, "elapsed_time": "16:49:29", "remaining_time": "1:16:51", "throughput": 3350.29, "total_tokens": 202925424} +{"current_steps": 166880, "total_steps": 179580, "loss": 0.6408, "lr": 7.580147507178364e-07, "epoch": 18.585588595611984, "percentage": 92.93, "elapsed_time": "16:49:31", "remaining_time": "1:16:49", "throughput": 3350.29, "total_tokens": 202931696} +{"current_steps": 166885, "total_steps": 179580, "loss": 0.7942, "lr": 7.574210846092444e-07, "epoch": 18.5861454504956, "percentage": 92.93, "elapsed_time": "16:49:33", "remaining_time": "1:16:47", "throughput": 3350.29, "total_tokens": 202937872} +{"current_steps": 166890, "total_steps": 179580, "loss": 0.8035, "lr": 7.568276474912372e-07, "epoch": 18.58670230537922, "percentage": 92.93, "elapsed_time": "16:49:34", "remaining_time": "1:16:45", "throughput": 3350.3, "total_tokens": 202943408} +{"current_steps": 166895, "total_steps": 179580, "loss": 0.7188, "lr": 7.562344393694104e-07, "epoch": 18.587259160262835, "percentage": 92.94, "elapsed_time": "16:49:36", "remaining_time": "1:16:44", "throughput": 3350.3, "total_tokens": 202949936} +{"current_steps": 166900, "total_steps": 179580, "loss": 0.5899, "lr": 7.556414602493788e-07, "epoch": 18.58781601514645, "percentage": 92.94, "elapsed_time": "16:49:38", "remaining_time": "1:16:42", "throughput": 3350.3, "total_tokens": 202955600} +{"current_steps": 166905, "total_steps": 179580, "loss": 0.7223, "lr": 7.550487101367354e-07, "epoch": 18.58837287003007, "percentage": 92.94, "elapsed_time": "16:49:40", "remaining_time": "1:16:40", "throughput": 3350.3, "total_tokens": 202961840} +{"current_steps": 166910, "total_steps": 179580, "loss": 0.7688, "lr": 7.54456189037081e-07, "epoch": 18.588929724913687, "percentage": 92.94, "elapsed_time": "16:49:41", "remaining_time": "1:16:38", "throughput": 3350.3, "total_tokens": 202967504} +{"current_steps": 166915, "total_steps": 179580, "loss": 1.0874, "lr": 7.538638969560114e-07, "epoch": 18.589486579797306, "percentage": 92.95, "elapsed_time": "16:49:43", "remaining_time": "1:16:36", "throughput": 3350.3, "total_tokens": 202972688} +{"current_steps": 166920, "total_steps": 179580, "loss": 0.5682, "lr": 7.532718338991273e-07, "epoch": 18.590043434680922, "percentage": 92.95, "elapsed_time": "16:49:45", "remaining_time": "1:16:35", "throughput": 3350.31, "total_tokens": 202979024} +{"current_steps": 166925, "total_steps": 179580, "loss": 0.678, "lr": 7.526799998720135e-07, "epoch": 18.590600289564538, "percentage": 92.95, "elapsed_time": "16:49:46", "remaining_time": "1:16:33", "throughput": 3350.31, "total_tokens": 202984368} +{"current_steps": 166930, "total_steps": 179580, "loss": 0.5204, "lr": 7.520883948802682e-07, "epoch": 18.591157144448157, "percentage": 92.96, "elapsed_time": "16:49:48", "remaining_time": "1:16:31", "throughput": 3350.32, "total_tokens": 202990768} +{"current_steps": 166935, "total_steps": 179580, "loss": 0.7257, "lr": 7.514970189294701e-07, "epoch": 18.591713999331773, "percentage": 92.96, "elapsed_time": "16:49:50", "remaining_time": "1:16:29", "throughput": 3350.32, "total_tokens": 202997072} +{"current_steps": 166940, "total_steps": 179580, "loss": 0.6081, "lr": 7.509058720252121e-07, "epoch": 18.592270854215393, "percentage": 92.96, "elapsed_time": "16:49:51", "remaining_time": "1:16:27", "throughput": 3350.32, "total_tokens": 203002704} +{"current_steps": 166945, "total_steps": 179580, "loss": 0.6734, "lr": 7.503149541730758e-07, "epoch": 18.59282770909901, "percentage": 92.96, "elapsed_time": "16:49:53", "remaining_time": "1:16:25", "throughput": 3350.33, "total_tokens": 203008848} +{"current_steps": 166950, "total_steps": 179580, "loss": 0.4878, "lr": 7.497242653786457e-07, "epoch": 18.593384563982625, "percentage": 92.97, "elapsed_time": "16:49:55", "remaining_time": "1:16:24", "throughput": 3350.33, "total_tokens": 203014320} +{"current_steps": 166955, "total_steps": 179580, "loss": 0.9239, "lr": 7.49133805647495e-07, "epoch": 18.593941418866244, "percentage": 92.97, "elapsed_time": "16:49:57", "remaining_time": "1:16:22", "throughput": 3350.33, "total_tokens": 203020336} +{"current_steps": 166960, "total_steps": 179580, "loss": 0.6528, "lr": 7.485435749852083e-07, "epoch": 18.59449827374986, "percentage": 92.97, "elapsed_time": "16:49:58", "remaining_time": "1:16:20", "throughput": 3350.33, "total_tokens": 203026544} +{"current_steps": 166965, "total_steps": 179580, "loss": 0.5746, "lr": 7.47953573397353e-07, "epoch": 18.59505512863348, "percentage": 92.98, "elapsed_time": "16:50:00", "remaining_time": "1:16:18", "throughput": 3350.34, "total_tokens": 203032912} +{"current_steps": 166970, "total_steps": 179580, "loss": 0.6256, "lr": 7.473638008895112e-07, "epoch": 18.595611983517095, "percentage": 92.98, "elapsed_time": "16:50:02", "remaining_time": "1:16:16", "throughput": 3350.34, "total_tokens": 203039280} +{"current_steps": 166975, "total_steps": 179580, "loss": 0.5222, "lr": 7.467742574672476e-07, "epoch": 18.59616883840071, "percentage": 92.98, "elapsed_time": "16:50:04", "remaining_time": "1:16:15", "throughput": 3350.34, "total_tokens": 203044848} +{"current_steps": 166980, "total_steps": 179580, "loss": 0.7692, "lr": 7.461849431361329e-07, "epoch": 18.59672569328433, "percentage": 92.98, "elapsed_time": "16:50:05", "remaining_time": "1:16:13", "throughput": 3350.35, "total_tokens": 203051088} +{"current_steps": 166985, "total_steps": 179580, "loss": 0.7397, "lr": 7.455958579017319e-07, "epoch": 18.597282548167946, "percentage": 92.99, "elapsed_time": "16:50:07", "remaining_time": "1:16:11", "throughput": 3350.35, "total_tokens": 203057360} +{"current_steps": 166990, "total_steps": 179580, "loss": 0.7383, "lr": 7.450070017696098e-07, "epoch": 18.597839403051566, "percentage": 92.99, "elapsed_time": "16:50:09", "remaining_time": "1:16:09", "throughput": 3350.36, "total_tokens": 203063536} +{"current_steps": 166995, "total_steps": 179580, "loss": 0.5838, "lr": 7.444183747453342e-07, "epoch": 18.598396257935182, "percentage": 92.99, "elapsed_time": "16:50:11", "remaining_time": "1:16:07", "throughput": 3350.36, "total_tokens": 203069904} +{"current_steps": 167000, "total_steps": 179580, "loss": 0.9277, "lr": 7.438299768344564e-07, "epoch": 18.598953112818798, "percentage": 92.99, "elapsed_time": "16:50:13", "remaining_time": "1:16:05", "throughput": 3350.36, "total_tokens": 203075792} +{"current_steps": 167005, "total_steps": 179580, "loss": 0.4435, "lr": 7.432418080425385e-07, "epoch": 18.599509967702417, "percentage": 93.0, "elapsed_time": "16:50:14", "remaining_time": "1:16:04", "throughput": 3350.37, "total_tokens": 203082256} +{"current_steps": 167010, "total_steps": 179580, "loss": 0.7081, "lr": 7.426538683751344e-07, "epoch": 18.600066822586033, "percentage": 93.0, "elapsed_time": "16:50:16", "remaining_time": "1:16:02", "throughput": 3350.37, "total_tokens": 203088976} +{"current_steps": 167015, "total_steps": 179580, "loss": 0.6215, "lr": 7.420661578378036e-07, "epoch": 18.600623677469653, "percentage": 93.0, "elapsed_time": "16:50:18", "remaining_time": "1:16:00", "throughput": 3350.38, "total_tokens": 203095184} +{"current_steps": 167020, "total_steps": 179580, "loss": 0.6157, "lr": 7.414786764360887e-07, "epoch": 18.60118053235327, "percentage": 93.01, "elapsed_time": "16:50:20", "remaining_time": "1:15:58", "throughput": 3350.38, "total_tokens": 203101328} +{"current_steps": 167025, "total_steps": 179580, "loss": 0.9991, "lr": 7.408914241755466e-07, "epoch": 18.601737387236888, "percentage": 93.01, "elapsed_time": "16:50:22", "remaining_time": "1:15:56", "throughput": 3350.38, "total_tokens": 203106832} +{"current_steps": 167030, "total_steps": 179580, "loss": 0.6314, "lr": 7.403044010617172e-07, "epoch": 18.602294242120504, "percentage": 93.01, "elapsed_time": "16:50:23", "remaining_time": "1:15:55", "throughput": 3350.38, "total_tokens": 203113040} +{"current_steps": 167035, "total_steps": 179580, "loss": 0.7003, "lr": 7.397176071001544e-07, "epoch": 18.60285109700412, "percentage": 93.01, "elapsed_time": "16:50:25", "remaining_time": "1:15:53", "throughput": 3350.39, "total_tokens": 203118832} +{"current_steps": 167040, "total_steps": 179580, "loss": 1.0263, "lr": 7.391310422963898e-07, "epoch": 18.60340795188774, "percentage": 93.02, "elapsed_time": "16:50:27", "remaining_time": "1:15:51", "throughput": 3350.39, "total_tokens": 203124912} +{"current_steps": 167045, "total_steps": 179580, "loss": 0.6787, "lr": 7.385447066559775e-07, "epoch": 18.603964806771355, "percentage": 93.02, "elapsed_time": "16:50:29", "remaining_time": "1:15:49", "throughput": 3350.39, "total_tokens": 203131216} +{"current_steps": 167050, "total_steps": 179580, "loss": 0.8512, "lr": 7.379586001844407e-07, "epoch": 18.60452166165497, "percentage": 93.02, "elapsed_time": "16:50:30", "remaining_time": "1:15:47", "throughput": 3350.39, "total_tokens": 203137488} +{"current_steps": 167055, "total_steps": 179580, "loss": 0.7428, "lr": 7.373727228873279e-07, "epoch": 18.60507851653859, "percentage": 93.03, "elapsed_time": "16:50:32", "remaining_time": "1:15:45", "throughput": 3350.4, "total_tokens": 203143824} +{"current_steps": 167060, "total_steps": 179580, "loss": 0.5298, "lr": 7.367870747701649e-07, "epoch": 18.605635371422206, "percentage": 93.03, "elapsed_time": "16:50:34", "remaining_time": "1:15:44", "throughput": 3350.4, "total_tokens": 203149936} +{"current_steps": 167065, "total_steps": 179580, "loss": 0.6362, "lr": 7.362016558384921e-07, "epoch": 18.606192226305826, "percentage": 93.03, "elapsed_time": "16:50:36", "remaining_time": "1:15:42", "throughput": 3350.41, "total_tokens": 203155600} +{"current_steps": 167070, "total_steps": 179580, "loss": 0.7913, "lr": 7.356164660978326e-07, "epoch": 18.60674908118944, "percentage": 93.03, "elapsed_time": "16:50:37", "remaining_time": "1:15:40", "throughput": 3350.41, "total_tokens": 203161392} +{"current_steps": 167075, "total_steps": 179580, "loss": 0.7776, "lr": 7.350315055537155e-07, "epoch": 18.60730593607306, "percentage": 93.04, "elapsed_time": "16:50:39", "remaining_time": "1:15:38", "throughput": 3350.41, "total_tokens": 203167376} +{"current_steps": 167080, "total_steps": 179580, "loss": 0.7102, "lr": 7.34446774211664e-07, "epoch": 18.607862790956677, "percentage": 93.04, "elapsed_time": "16:50:41", "remaining_time": "1:15:36", "throughput": 3350.41, "total_tokens": 203173328} +{"current_steps": 167085, "total_steps": 179580, "loss": 0.8597, "lr": 7.338622720772071e-07, "epoch": 18.608419645840293, "percentage": 93.04, "elapsed_time": "16:50:43", "remaining_time": "1:15:35", "throughput": 3350.42, "total_tokens": 203179472} +{"current_steps": 167090, "total_steps": 179580, "loss": 0.7983, "lr": 7.332779991558652e-07, "epoch": 18.608976500723912, "percentage": 93.04, "elapsed_time": "16:50:44", "remaining_time": "1:15:33", "throughput": 3350.42, "total_tokens": 203185552} +{"current_steps": 167095, "total_steps": 179580, "loss": 0.8628, "lr": 7.326939554531509e-07, "epoch": 18.609533355607528, "percentage": 93.05, "elapsed_time": "16:50:46", "remaining_time": "1:15:31", "throughput": 3350.42, "total_tokens": 203191344} +{"current_steps": 167100, "total_steps": 179580, "loss": 0.6355, "lr": 7.321101409745846e-07, "epoch": 18.610090210491148, "percentage": 93.05, "elapsed_time": "16:50:48", "remaining_time": "1:15:29", "throughput": 3350.42, "total_tokens": 203196656} +{"current_steps": 167105, "total_steps": 179580, "loss": 0.5954, "lr": 7.315265557256839e-07, "epoch": 18.610647065374764, "percentage": 93.05, "elapsed_time": "16:50:49", "remaining_time": "1:15:27", "throughput": 3350.43, "total_tokens": 203202992} +{"current_steps": 167110, "total_steps": 179580, "loss": 0.6852, "lr": 7.309431997119532e-07, "epoch": 18.61120392025838, "percentage": 93.06, "elapsed_time": "16:50:51", "remaining_time": "1:15:25", "throughput": 3350.43, "total_tokens": 203209328} +{"current_steps": 167115, "total_steps": 179580, "loss": 0.6488, "lr": 7.303600729389127e-07, "epoch": 18.611760775142, "percentage": 93.06, "elapsed_time": "16:50:53", "remaining_time": "1:15:24", "throughput": 3350.44, "total_tokens": 203215440} +{"current_steps": 167120, "total_steps": 179580, "loss": 0.7242, "lr": 7.297771754120664e-07, "epoch": 18.612317630025615, "percentage": 93.06, "elapsed_time": "16:50:55", "remaining_time": "1:15:22", "throughput": 3350.44, "total_tokens": 203221520} +{"current_steps": 167125, "total_steps": 179580, "loss": 0.6326, "lr": 7.291945071369182e-07, "epoch": 18.612874484909234, "percentage": 93.06, "elapsed_time": "16:50:56", "remaining_time": "1:15:20", "throughput": 3350.44, "total_tokens": 203227792} +{"current_steps": 167130, "total_steps": 179580, "loss": 0.9112, "lr": 7.286120681189723e-07, "epoch": 18.61343133979285, "percentage": 93.07, "elapsed_time": "16:50:58", "remaining_time": "1:15:18", "throughput": 3350.44, "total_tokens": 203234064} +{"current_steps": 167135, "total_steps": 179580, "loss": 0.7212, "lr": 7.280298583637324e-07, "epoch": 18.613988194676466, "percentage": 93.07, "elapsed_time": "16:51:00", "remaining_time": "1:15:16", "throughput": 3350.45, "total_tokens": 203240240} +{"current_steps": 167140, "total_steps": 179580, "loss": 0.6938, "lr": 7.274478778766968e-07, "epoch": 18.614545049560085, "percentage": 93.07, "elapsed_time": "16:51:02", "remaining_time": "1:15:15", "throughput": 3350.45, "total_tokens": 203246384} +{"current_steps": 167145, "total_steps": 179580, "loss": 0.6592, "lr": 7.268661266633641e-07, "epoch": 18.6151019044437, "percentage": 93.08, "elapsed_time": "16:51:04", "remaining_time": "1:15:13", "throughput": 3350.45, "total_tokens": 203252528} +{"current_steps": 167150, "total_steps": 179580, "loss": 0.7105, "lr": 7.262846047292243e-07, "epoch": 18.61565875932732, "percentage": 93.08, "elapsed_time": "16:51:05", "remaining_time": "1:15:11", "throughput": 3350.45, "total_tokens": 203258544} +{"current_steps": 167155, "total_steps": 179580, "loss": 0.7016, "lr": 7.257033120797757e-07, "epoch": 18.616215614210937, "percentage": 93.08, "elapsed_time": "16:51:07", "remaining_time": "1:15:09", "throughput": 3350.46, "total_tokens": 203264720} +{"current_steps": 167160, "total_steps": 179580, "loss": 0.6451, "lr": 7.251222487205083e-07, "epoch": 18.616772469094553, "percentage": 93.08, "elapsed_time": "16:51:09", "remaining_time": "1:15:07", "throughput": 3350.46, "total_tokens": 203270928} +{"current_steps": 167165, "total_steps": 179580, "loss": 0.8051, "lr": 7.245414146569124e-07, "epoch": 18.617329323978172, "percentage": 93.09, "elapsed_time": "16:51:11", "remaining_time": "1:15:05", "throughput": 3350.46, "total_tokens": 203277040} +{"current_steps": 167170, "total_steps": 179580, "loss": 0.5034, "lr": 7.239608098944694e-07, "epoch": 18.617886178861788, "percentage": 93.09, "elapsed_time": "16:51:13", "remaining_time": "1:15:04", "throughput": 3350.47, "total_tokens": 203283280} +{"current_steps": 167175, "total_steps": 179580, "loss": 0.4966, "lr": 7.233804344386669e-07, "epoch": 18.618443033745407, "percentage": 93.09, "elapsed_time": "16:51:14", "remaining_time": "1:15:02", "throughput": 3350.47, "total_tokens": 203289584} +{"current_steps": 167180, "total_steps": 179580, "loss": 0.5652, "lr": 7.228002882949835e-07, "epoch": 18.618999888629023, "percentage": 93.09, "elapsed_time": "16:51:16", "remaining_time": "1:15:00", "throughput": 3350.47, "total_tokens": 203295216} +{"current_steps": 167185, "total_steps": 179580, "loss": 0.8348, "lr": 7.222203714689041e-07, "epoch": 18.61955674351264, "percentage": 93.1, "elapsed_time": "16:51:18", "remaining_time": "1:14:58", "throughput": 3350.48, "total_tokens": 203301424} +{"current_steps": 167190, "total_steps": 179580, "loss": 0.6187, "lr": 7.216406839659073e-07, "epoch": 18.62011359839626, "percentage": 93.1, "elapsed_time": "16:51:20", "remaining_time": "1:14:56", "throughput": 3350.48, "total_tokens": 203307632} +{"current_steps": 167195, "total_steps": 179580, "loss": 0.8804, "lr": 7.21061225791464e-07, "epoch": 18.620670453279875, "percentage": 93.1, "elapsed_time": "16:51:21", "remaining_time": "1:14:55", "throughput": 3350.48, "total_tokens": 203313904} +{"current_steps": 167200, "total_steps": 179580, "loss": 0.8111, "lr": 7.204819969510446e-07, "epoch": 18.621227308163494, "percentage": 93.11, "elapsed_time": "16:51:23", "remaining_time": "1:14:53", "throughput": 3350.49, "total_tokens": 203319728} +{"current_steps": 167205, "total_steps": 179580, "loss": 0.696, "lr": 7.199029974501309e-07, "epoch": 18.62178416304711, "percentage": 93.11, "elapsed_time": "16:51:25", "remaining_time": "1:14:51", "throughput": 3350.49, "total_tokens": 203326032} +{"current_steps": 167210, "total_steps": 179580, "loss": 0.7563, "lr": 7.193242272941853e-07, "epoch": 18.622341017930726, "percentage": 93.11, "elapsed_time": "16:51:27", "remaining_time": "1:14:49", "throughput": 3350.49, "total_tokens": 203332336} +{"current_steps": 167215, "total_steps": 179580, "loss": 0.8878, "lr": 7.187456864886755e-07, "epoch": 18.622897872814345, "percentage": 93.11, "elapsed_time": "16:51:28", "remaining_time": "1:14:47", "throughput": 3350.5, "total_tokens": 203338096} +{"current_steps": 167220, "total_steps": 179580, "loss": 0.7435, "lr": 7.181673750390639e-07, "epoch": 18.62345472769796, "percentage": 93.12, "elapsed_time": "16:51:30", "remaining_time": "1:14:45", "throughput": 3350.5, "total_tokens": 203343856} +{"current_steps": 167225, "total_steps": 179580, "loss": 0.8691, "lr": 7.175892929508182e-07, "epoch": 18.62401158258158, "percentage": 93.12, "elapsed_time": "16:51:32", "remaining_time": "1:14:44", "throughput": 3350.5, "total_tokens": 203349872} +{"current_steps": 167230, "total_steps": 179580, "loss": 0.6868, "lr": 7.170114402293926e-07, "epoch": 18.624568437465197, "percentage": 93.12, "elapsed_time": "16:51:34", "remaining_time": "1:14:42", "throughput": 3350.5, "total_tokens": 203355984} +{"current_steps": 167235, "total_steps": 179580, "loss": 0.9433, "lr": 7.164338168802576e-07, "epoch": 18.625125292348812, "percentage": 93.13, "elapsed_time": "16:51:35", "remaining_time": "1:14:40", "throughput": 3350.51, "total_tokens": 203361616} +{"current_steps": 167240, "total_steps": 179580, "loss": 0.8357, "lr": 7.158564229088532e-07, "epoch": 18.625682147232432, "percentage": 93.13, "elapsed_time": "16:51:37", "remaining_time": "1:14:38", "throughput": 3350.51, "total_tokens": 203367856} +{"current_steps": 167245, "total_steps": 179580, "loss": 0.583, "lr": 7.152792583206447e-07, "epoch": 18.626239002116048, "percentage": 93.13, "elapsed_time": "16:51:39", "remaining_time": "1:14:36", "throughput": 3350.52, "total_tokens": 203374224} +{"current_steps": 167250, "total_steps": 179580, "loss": 0.7859, "lr": 7.147023231210748e-07, "epoch": 18.626795856999667, "percentage": 93.13, "elapsed_time": "16:51:41", "remaining_time": "1:14:35", "throughput": 3350.52, "total_tokens": 203380272} +{"current_steps": 167255, "total_steps": 179580, "loss": 0.5007, "lr": 7.141256173156058e-07, "epoch": 18.627352711883283, "percentage": 93.14, "elapsed_time": "16:51:42", "remaining_time": "1:14:33", "throughput": 3350.52, "total_tokens": 203386480} +{"current_steps": 167260, "total_steps": 179580, "loss": 0.9698, "lr": 7.13549140909675e-07, "epoch": 18.6279095667669, "percentage": 93.14, "elapsed_time": "16:51:44", "remaining_time": "1:14:31", "throughput": 3350.53, "total_tokens": 203393200} +{"current_steps": 167265, "total_steps": 179580, "loss": 0.5973, "lr": 7.129728939087311e-07, "epoch": 18.62846642165052, "percentage": 93.14, "elapsed_time": "16:51:46", "remaining_time": "1:14:29", "throughput": 3350.53, "total_tokens": 203399664} +{"current_steps": 167270, "total_steps": 179580, "loss": 0.8095, "lr": 7.123968763182137e-07, "epoch": 18.629023276534134, "percentage": 93.15, "elapsed_time": "16:51:48", "remaining_time": "1:14:27", "throughput": 3350.53, "total_tokens": 203405456} +{"current_steps": 167275, "total_steps": 179580, "loss": 0.8073, "lr": 7.118210881435689e-07, "epoch": 18.629580131417754, "percentage": 93.15, "elapsed_time": "16:51:50", "remaining_time": "1:14:25", "throughput": 3350.54, "total_tokens": 203411568} +{"current_steps": 167280, "total_steps": 179580, "loss": 1.0091, "lr": 7.112455293902337e-07, "epoch": 18.63013698630137, "percentage": 93.15, "elapsed_time": "16:51:51", "remaining_time": "1:14:24", "throughput": 3350.54, "total_tokens": 203417552} +{"current_steps": 167285, "total_steps": 179580, "loss": 0.7553, "lr": 7.106702000636456e-07, "epoch": 18.630693841184986, "percentage": 93.15, "elapsed_time": "16:51:53", "remaining_time": "1:14:22", "throughput": 3350.54, "total_tokens": 203423920} +{"current_steps": 167290, "total_steps": 179580, "loss": 1.0707, "lr": 7.100951001692336e-07, "epoch": 18.631250696068605, "percentage": 93.16, "elapsed_time": "16:51:55", "remaining_time": "1:14:20", "throughput": 3350.55, "total_tokens": 203429936} +{"current_steps": 167295, "total_steps": 179580, "loss": 0.593, "lr": 7.095202297124376e-07, "epoch": 18.63180755095222, "percentage": 93.16, "elapsed_time": "16:51:57", "remaining_time": "1:14:18", "throughput": 3350.55, "total_tokens": 203435664} +{"current_steps": 167300, "total_steps": 179580, "loss": 0.6762, "lr": 7.089455886986813e-07, "epoch": 18.63236440583584, "percentage": 93.16, "elapsed_time": "16:51:58", "remaining_time": "1:14:16", "throughput": 3350.55, "total_tokens": 203441968} +{"current_steps": 167305, "total_steps": 179580, "loss": 0.6051, "lr": 7.083711771333989e-07, "epoch": 18.632921260719456, "percentage": 93.16, "elapsed_time": "16:52:00", "remaining_time": "1:14:15", "throughput": 3350.56, "total_tokens": 203448112} +{"current_steps": 167310, "total_steps": 179580, "loss": 0.9014, "lr": 7.077969950220115e-07, "epoch": 18.633478115603072, "percentage": 93.17, "elapsed_time": "16:52:02", "remaining_time": "1:14:13", "throughput": 3350.56, "total_tokens": 203454448} +{"current_steps": 167315, "total_steps": 179580, "loss": 0.669, "lr": 7.072230423699422e-07, "epoch": 18.63403497048669, "percentage": 93.17, "elapsed_time": "16:52:04", "remaining_time": "1:14:11", "throughput": 3350.57, "total_tokens": 203460880} +{"current_steps": 167320, "total_steps": 179580, "loss": 0.8111, "lr": 7.066493191826146e-07, "epoch": 18.634591825370308, "percentage": 93.17, "elapsed_time": "16:52:06", "remaining_time": "1:14:09", "throughput": 3350.57, "total_tokens": 203467088} +{"current_steps": 167325, "total_steps": 179580, "loss": 0.5792, "lr": 7.060758254654492e-07, "epoch": 18.635148680253927, "percentage": 93.18, "elapsed_time": "16:52:07", "remaining_time": "1:14:07", "throughput": 3350.57, "total_tokens": 203473296} +{"current_steps": 167330, "total_steps": 179580, "loss": 0.6482, "lr": 7.055025612238642e-07, "epoch": 18.635705535137543, "percentage": 93.18, "elapsed_time": "16:52:09", "remaining_time": "1:14:05", "throughput": 3350.58, "total_tokens": 203479152} +{"current_steps": 167335, "total_steps": 179580, "loss": 0.8397, "lr": 7.049295264632689e-07, "epoch": 18.63626239002116, "percentage": 93.18, "elapsed_time": "16:52:11", "remaining_time": "1:14:04", "throughput": 3350.58, "total_tokens": 203485104} +{"current_steps": 167340, "total_steps": 179580, "loss": 0.5594, "lr": 7.043567211890784e-07, "epoch": 18.63681924490478, "percentage": 93.18, "elapsed_time": "16:52:13", "remaining_time": "1:14:02", "throughput": 3350.58, "total_tokens": 203491312} +{"current_steps": 167345, "total_steps": 179580, "loss": 0.7817, "lr": 7.037841454067051e-07, "epoch": 18.637376099788394, "percentage": 93.19, "elapsed_time": "16:52:14", "remaining_time": "1:14:00", "throughput": 3350.58, "total_tokens": 203497232} +{"current_steps": 167350, "total_steps": 179580, "loss": 0.716, "lr": 7.032117991215587e-07, "epoch": 18.637932954672014, "percentage": 93.19, "elapsed_time": "16:52:16", "remaining_time": "1:13:58", "throughput": 3350.59, "total_tokens": 203503184} +{"current_steps": 167355, "total_steps": 179580, "loss": 0.6975, "lr": 7.026396823390402e-07, "epoch": 18.63848980955563, "percentage": 93.19, "elapsed_time": "16:52:18", "remaining_time": "1:13:56", "throughput": 3350.59, "total_tokens": 203509552} +{"current_steps": 167360, "total_steps": 179580, "loss": 0.8155, "lr": 7.020677950645566e-07, "epoch": 18.63904666443925, "percentage": 93.2, "elapsed_time": "16:52:20", "remaining_time": "1:13:55", "throughput": 3350.59, "total_tokens": 203515024} +{"current_steps": 167365, "total_steps": 179580, "loss": 0.7368, "lr": 7.014961373035089e-07, "epoch": 18.639603519322865, "percentage": 93.2, "elapsed_time": "16:52:21", "remaining_time": "1:13:53", "throughput": 3350.6, "total_tokens": 203521264} +{"current_steps": 167370, "total_steps": 179580, "loss": 0.6553, "lr": 7.009247090612986e-07, "epoch": 18.64016037420648, "percentage": 93.2, "elapsed_time": "16:52:23", "remaining_time": "1:13:51", "throughput": 3350.6, "total_tokens": 203527248} +{"current_steps": 167375, "total_steps": 179580, "loss": 0.4489, "lr": 7.00353510343324e-07, "epoch": 18.6407172290901, "percentage": 93.2, "elapsed_time": "16:52:25", "remaining_time": "1:13:49", "throughput": 3350.6, "total_tokens": 203533296} +{"current_steps": 167380, "total_steps": 179580, "loss": 0.9575, "lr": 6.99782541154978e-07, "epoch": 18.641274083973716, "percentage": 93.21, "elapsed_time": "16:52:27", "remaining_time": "1:13:47", "throughput": 3350.6, "total_tokens": 203539504} +{"current_steps": 167385, "total_steps": 179580, "loss": 0.7284, "lr": 6.992118015016564e-07, "epoch": 18.641830938857332, "percentage": 93.21, "elapsed_time": "16:52:28", "remaining_time": "1:13:45", "throughput": 3350.61, "total_tokens": 203545488} +{"current_steps": 167390, "total_steps": 179580, "loss": 0.5647, "lr": 6.986412913887463e-07, "epoch": 18.64238779374095, "percentage": 93.21, "elapsed_time": "16:52:30", "remaining_time": "1:13:44", "throughput": 3350.61, "total_tokens": 203551664} +{"current_steps": 167395, "total_steps": 179580, "loss": 0.7792, "lr": 6.980710108216409e-07, "epoch": 18.642944648624567, "percentage": 93.21, "elapsed_time": "16:52:32", "remaining_time": "1:13:42", "throughput": 3350.61, "total_tokens": 203557776} +{"current_steps": 167400, "total_steps": 179580, "loss": 0.8588, "lr": 6.975009598057247e-07, "epoch": 18.643501503508187, "percentage": 93.22, "elapsed_time": "16:52:34", "remaining_time": "1:13:40", "throughput": 3350.62, "total_tokens": 203563856} +{"current_steps": 167405, "total_steps": 179580, "loss": 0.6918, "lr": 6.96931138346385e-07, "epoch": 18.644058358391803, "percentage": 93.22, "elapsed_time": "16:52:35", "remaining_time": "1:13:38", "throughput": 3350.62, "total_tokens": 203569296} +{"current_steps": 167410, "total_steps": 179580, "loss": 0.6144, "lr": 6.96361546448998e-07, "epoch": 18.644615213275422, "percentage": 93.22, "elapsed_time": "16:52:37", "remaining_time": "1:13:36", "throughput": 3350.62, "total_tokens": 203575440} +{"current_steps": 167415, "total_steps": 179580, "loss": 0.9157, "lr": 6.957921841189485e-07, "epoch": 18.645172068159038, "percentage": 93.23, "elapsed_time": "16:52:39", "remaining_time": "1:13:35", "throughput": 3350.63, "total_tokens": 203581936} +{"current_steps": 167420, "total_steps": 179580, "loss": 0.8258, "lr": 6.952230513616182e-07, "epoch": 18.645728923042654, "percentage": 93.23, "elapsed_time": "16:52:41", "remaining_time": "1:13:33", "throughput": 3350.63, "total_tokens": 203588144} +{"current_steps": 167425, "total_steps": 179580, "loss": 0.7545, "lr": 6.946541481823749e-07, "epoch": 18.646285777926273, "percentage": 93.23, "elapsed_time": "16:52:42", "remaining_time": "1:13:31", "throughput": 3350.63, "total_tokens": 203593776} +{"current_steps": 167430, "total_steps": 179580, "loss": 0.4453, "lr": 6.940854745865977e-07, "epoch": 18.64684263280989, "percentage": 93.23, "elapsed_time": "16:52:44", "remaining_time": "1:13:29", "throughput": 3350.64, "total_tokens": 203599920} +{"current_steps": 167435, "total_steps": 179580, "loss": 0.5538, "lr": 6.935170305796546e-07, "epoch": 18.64739948769351, "percentage": 93.24, "elapsed_time": "16:52:46", "remaining_time": "1:13:27", "throughput": 3350.64, "total_tokens": 203605744} +{"current_steps": 167440, "total_steps": 179580, "loss": 0.8782, "lr": 6.929488161669217e-07, "epoch": 18.647956342577125, "percentage": 93.24, "elapsed_time": "16:52:48", "remaining_time": "1:13:25", "throughput": 3350.65, "total_tokens": 203612432} +{"current_steps": 167445, "total_steps": 179580, "loss": 0.7318, "lr": 6.923808313537561e-07, "epoch": 18.64851319746074, "percentage": 93.24, "elapsed_time": "16:52:49", "remaining_time": "1:13:24", "throughput": 3350.65, "total_tokens": 203618192} +{"current_steps": 167450, "total_steps": 179580, "loss": 0.6564, "lr": 6.918130761455338e-07, "epoch": 18.64907005234436, "percentage": 93.25, "elapsed_time": "16:52:51", "remaining_time": "1:13:22", "throughput": 3350.65, "total_tokens": 203624400} +{"current_steps": 167455, "total_steps": 179580, "loss": 0.6742, "lr": 6.91245550547609e-07, "epoch": 18.649626907227976, "percentage": 93.25, "elapsed_time": "16:52:53", "remaining_time": "1:13:20", "throughput": 3350.65, "total_tokens": 203630352} +{"current_steps": 167460, "total_steps": 179580, "loss": 0.6355, "lr": 6.906782545653467e-07, "epoch": 18.650183762111595, "percentage": 93.25, "elapsed_time": "16:52:55", "remaining_time": "1:13:18", "throughput": 3350.66, "total_tokens": 203636144} +{"current_steps": 167465, "total_steps": 179580, "loss": 0.7558, "lr": 6.901111882041039e-07, "epoch": 18.65074061699521, "percentage": 93.25, "elapsed_time": "16:52:56", "remaining_time": "1:13:16", "throughput": 3350.66, "total_tokens": 203642512} +{"current_steps": 167470, "total_steps": 179580, "loss": 0.6853, "lr": 6.895443514692374e-07, "epoch": 18.651297471878827, "percentage": 93.26, "elapsed_time": "16:52:58", "remaining_time": "1:13:14", "throughput": 3350.66, "total_tokens": 203648496} +{"current_steps": 167475, "total_steps": 179580, "loss": 0.7521, "lr": 6.889777443661039e-07, "epoch": 18.651854326762447, "percentage": 93.26, "elapsed_time": "16:53:00", "remaining_time": "1:13:13", "throughput": 3350.67, "total_tokens": 203654544} +{"current_steps": 167480, "total_steps": 179580, "loss": 0.6001, "lr": 6.884113669000547e-07, "epoch": 18.652411181646062, "percentage": 93.26, "elapsed_time": "16:53:02", "remaining_time": "1:13:11", "throughput": 3350.67, "total_tokens": 203660720} +{"current_steps": 167485, "total_steps": 179580, "loss": 0.7396, "lr": 6.878452190764329e-07, "epoch": 18.652968036529682, "percentage": 93.26, "elapsed_time": "16:53:03", "remaining_time": "1:13:09", "throughput": 3350.67, "total_tokens": 203666672} +{"current_steps": 167490, "total_steps": 179580, "loss": 0.7362, "lr": 6.872793009005951e-07, "epoch": 18.653524891413298, "percentage": 93.27, "elapsed_time": "16:53:05", "remaining_time": "1:13:07", "throughput": 3350.68, "total_tokens": 203672848} +{"current_steps": 167495, "total_steps": 179580, "loss": 0.9369, "lr": 6.867136123778817e-07, "epoch": 18.654081746296914, "percentage": 93.27, "elapsed_time": "16:53:07", "remaining_time": "1:13:05", "throughput": 3350.68, "total_tokens": 203678576} +{"current_steps": 167500, "total_steps": 179580, "loss": 0.7826, "lr": 6.861481535136411e-07, "epoch": 18.654638601180533, "percentage": 93.27, "elapsed_time": "16:53:09", "remaining_time": "1:13:04", "throughput": 3350.68, "total_tokens": 203684624} +{"current_steps": 167505, "total_steps": 179580, "loss": 0.6214, "lr": 6.85582924313205e-07, "epoch": 18.65519545606415, "percentage": 93.28, "elapsed_time": "16:53:10", "remaining_time": "1:13:02", "throughput": 3350.68, "total_tokens": 203690480} +{"current_steps": 167510, "total_steps": 179580, "loss": 0.8305, "lr": 6.850179247819249e-07, "epoch": 18.65575231094777, "percentage": 93.28, "elapsed_time": "16:53:12", "remaining_time": "1:13:00", "throughput": 3350.69, "total_tokens": 203696624} +{"current_steps": 167515, "total_steps": 179580, "loss": 0.6197, "lr": 6.84453154925127e-07, "epoch": 18.656309165831384, "percentage": 93.28, "elapsed_time": "16:53:14", "remaining_time": "1:12:58", "throughput": 3350.69, "total_tokens": 203702192} +{"current_steps": 167520, "total_steps": 179580, "loss": 0.6894, "lr": 6.838886147481516e-07, "epoch": 18.656866020715, "percentage": 93.28, "elapsed_time": "16:53:15", "remaining_time": "1:12:56", "throughput": 3350.69, "total_tokens": 203708368} +{"current_steps": 167525, "total_steps": 179580, "loss": 0.5446, "lr": 6.833243042563303e-07, "epoch": 18.65742287559862, "percentage": 93.29, "elapsed_time": "16:53:17", "remaining_time": "1:12:54", "throughput": 3350.7, "total_tokens": 203714480} +{"current_steps": 167530, "total_steps": 179580, "loss": 0.8359, "lr": 6.827602234549952e-07, "epoch": 18.657979730482236, "percentage": 93.29, "elapsed_time": "16:53:19", "remaining_time": "1:12:53", "throughput": 3350.7, "total_tokens": 203720496} +{"current_steps": 167535, "total_steps": 179580, "loss": 0.6506, "lr": 6.821963723494667e-07, "epoch": 18.658536585365855, "percentage": 93.29, "elapsed_time": "16:53:21", "remaining_time": "1:12:51", "throughput": 3350.7, "total_tokens": 203726512} +{"current_steps": 167540, "total_steps": 179580, "loss": 0.522, "lr": 6.816327509450826e-07, "epoch": 18.65909344024947, "percentage": 93.3, "elapsed_time": "16:53:22", "remaining_time": "1:12:49", "throughput": 3350.71, "total_tokens": 203732784} +{"current_steps": 167545, "total_steps": 179580, "loss": 0.5684, "lr": 6.810693592471579e-07, "epoch": 18.659650295133087, "percentage": 93.3, "elapsed_time": "16:53:24", "remaining_time": "1:12:47", "throughput": 3350.71, "total_tokens": 203739024} +{"current_steps": 167550, "total_steps": 179580, "loss": 0.6108, "lr": 6.805061972610188e-07, "epoch": 18.660207150016706, "percentage": 93.3, "elapsed_time": "16:53:26", "remaining_time": "1:12:45", "throughput": 3350.71, "total_tokens": 203745200} +{"current_steps": 167555, "total_steps": 179580, "loss": 0.8528, "lr": 6.799432649919807e-07, "epoch": 18.660764004900322, "percentage": 93.3, "elapsed_time": "16:53:28", "remaining_time": "1:12:44", "throughput": 3350.72, "total_tokens": 203751248} +{"current_steps": 167560, "total_steps": 179580, "loss": 0.7549, "lr": 6.793805624453642e-07, "epoch": 18.66132085978394, "percentage": 93.31, "elapsed_time": "16:53:30", "remaining_time": "1:12:42", "throughput": 3350.72, "total_tokens": 203757264} +{"current_steps": 167565, "total_steps": 179580, "loss": 0.6801, "lr": 6.788180896264817e-07, "epoch": 18.661877714667558, "percentage": 93.31, "elapsed_time": "16:53:31", "remaining_time": "1:12:40", "throughput": 3350.72, "total_tokens": 203763312} +{"current_steps": 167570, "total_steps": 179580, "loss": 0.6719, "lr": 6.782558465406541e-07, "epoch": 18.662434569551174, "percentage": 93.31, "elapsed_time": "16:53:33", "remaining_time": "1:12:38", "throughput": 3350.72, "total_tokens": 203769424} +{"current_steps": 167575, "total_steps": 179580, "loss": 0.5508, "lr": 6.776938331931825e-07, "epoch": 18.662991424434793, "percentage": 93.31, "elapsed_time": "16:53:35", "remaining_time": "1:12:36", "throughput": 3350.73, "total_tokens": 203775408} +{"current_steps": 167580, "total_steps": 179580, "loss": 0.8498, "lr": 6.771320495893796e-07, "epoch": 18.66354827931841, "percentage": 93.32, "elapsed_time": "16:53:37", "remaining_time": "1:12:34", "throughput": 3350.73, "total_tokens": 203781648} +{"current_steps": 167585, "total_steps": 179580, "loss": 0.6832, "lr": 6.765704957345492e-07, "epoch": 18.66410513420203, "percentage": 93.32, "elapsed_time": "16:53:38", "remaining_time": "1:12:33", "throughput": 3350.74, "total_tokens": 203787952} +{"current_steps": 167590, "total_steps": 179580, "loss": 0.5473, "lr": 6.760091716340011e-07, "epoch": 18.664661989085644, "percentage": 93.32, "elapsed_time": "16:53:40", "remaining_time": "1:12:31", "throughput": 3350.74, "total_tokens": 203794128} +{"current_steps": 167595, "total_steps": 179580, "loss": 0.8994, "lr": 6.754480772930338e-07, "epoch": 18.66521884396926, "percentage": 93.33, "elapsed_time": "16:53:42", "remaining_time": "1:12:29", "throughput": 3350.74, "total_tokens": 203800080} +{"current_steps": 167600, "total_steps": 179580, "loss": 0.6662, "lr": 6.748872127169487e-07, "epoch": 18.66577569885288, "percentage": 93.33, "elapsed_time": "16:53:44", "remaining_time": "1:12:27", "throughput": 3350.75, "total_tokens": 203805808} +{"current_steps": 167605, "total_steps": 179580, "loss": 0.7567, "lr": 6.743265779110413e-07, "epoch": 18.666332553736495, "percentage": 93.33, "elapsed_time": "16:53:45", "remaining_time": "1:12:25", "throughput": 3350.75, "total_tokens": 203811664} +{"current_steps": 167610, "total_steps": 179580, "loss": 0.8168, "lr": 6.737661728806105e-07, "epoch": 18.666889408620115, "percentage": 93.33, "elapsed_time": "16:53:47", "remaining_time": "1:12:24", "throughput": 3350.75, "total_tokens": 203817104} +{"current_steps": 167615, "total_steps": 179580, "loss": 0.8948, "lr": 6.732059976309463e-07, "epoch": 18.66744626350373, "percentage": 93.34, "elapsed_time": "16:53:49", "remaining_time": "1:12:22", "throughput": 3350.75, "total_tokens": 203823184} +{"current_steps": 167620, "total_steps": 179580, "loss": 0.6898, "lr": 6.726460521673445e-07, "epoch": 18.668003118387347, "percentage": 93.34, "elapsed_time": "16:53:50", "remaining_time": "1:12:20", "throughput": 3350.76, "total_tokens": 203829424} +{"current_steps": 167625, "total_steps": 179580, "loss": 0.6282, "lr": 6.720863364950869e-07, "epoch": 18.668559973270966, "percentage": 93.34, "elapsed_time": "16:53:52", "remaining_time": "1:12:18", "throughput": 3350.76, "total_tokens": 203835312} +{"current_steps": 167630, "total_steps": 179580, "loss": 0.7387, "lr": 6.715268506194694e-07, "epoch": 18.669116828154582, "percentage": 93.35, "elapsed_time": "16:53:54", "remaining_time": "1:12:16", "throughput": 3350.76, "total_tokens": 203841264} +{"current_steps": 167635, "total_steps": 179580, "loss": 0.5872, "lr": 6.709675945457683e-07, "epoch": 18.6696736830382, "percentage": 93.35, "elapsed_time": "16:53:56", "remaining_time": "1:12:14", "throughput": 3350.76, "total_tokens": 203847408} +{"current_steps": 167640, "total_steps": 179580, "loss": 0.8043, "lr": 6.704085682792765e-07, "epoch": 18.670230537921817, "percentage": 93.35, "elapsed_time": "16:53:57", "remaining_time": "1:12:13", "throughput": 3350.77, "total_tokens": 203853552} +{"current_steps": 167645, "total_steps": 179580, "loss": 0.8753, "lr": 6.698497718252622e-07, "epoch": 18.670787392805433, "percentage": 93.35, "elapsed_time": "16:53:59", "remaining_time": "1:12:11", "throughput": 3350.77, "total_tokens": 203859632} +{"current_steps": 167650, "total_steps": 179580, "loss": 0.8454, "lr": 6.692912051890127e-07, "epoch": 18.671344247689053, "percentage": 93.36, "elapsed_time": "16:54:01", "remaining_time": "1:12:09", "throughput": 3350.78, "total_tokens": 203866352} +{"current_steps": 167655, "total_steps": 179580, "loss": 0.6466, "lr": 6.687328683757987e-07, "epoch": 18.67190110257267, "percentage": 93.36, "elapsed_time": "16:54:03", "remaining_time": "1:12:07", "throughput": 3350.78, "total_tokens": 203872560} +{"current_steps": 167660, "total_steps": 179580, "loss": 0.8515, "lr": 6.681747613908995e-07, "epoch": 18.672457957456288, "percentage": 93.36, "elapsed_time": "16:54:05", "remaining_time": "1:12:05", "throughput": 3350.78, "total_tokens": 203878512} +{"current_steps": 167665, "total_steps": 179580, "loss": 0.5593, "lr": 6.67616884239583e-07, "epoch": 18.673014812339904, "percentage": 93.37, "elapsed_time": "16:54:06", "remaining_time": "1:12:04", "throughput": 3350.79, "total_tokens": 203884432} +{"current_steps": 167670, "total_steps": 179580, "loss": 0.7161, "lr": 6.670592369271229e-07, "epoch": 18.67357166722352, "percentage": 93.37, "elapsed_time": "16:54:08", "remaining_time": "1:12:02", "throughput": 3350.79, "total_tokens": 203890480} +{"current_steps": 167675, "total_steps": 179580, "loss": 0.7822, "lr": 6.665018194587786e-07, "epoch": 18.67412852210714, "percentage": 93.37, "elapsed_time": "16:54:10", "remaining_time": "1:12:00", "throughput": 3350.79, "total_tokens": 203896304} +{"current_steps": 167680, "total_steps": 179580, "loss": 0.7329, "lr": 6.659446318398211e-07, "epoch": 18.674685376990755, "percentage": 93.37, "elapsed_time": "16:54:11", "remaining_time": "1:11:58", "throughput": 3350.8, "total_tokens": 203902480} +{"current_steps": 167685, "total_steps": 179580, "loss": 0.5668, "lr": 6.653876740755155e-07, "epoch": 18.675242231874375, "percentage": 93.38, "elapsed_time": "16:54:13", "remaining_time": "1:11:56", "throughput": 3350.8, "total_tokens": 203908752} +{"current_steps": 167690, "total_steps": 179580, "loss": 0.9594, "lr": 6.648309461711189e-07, "epoch": 18.67579908675799, "percentage": 93.38, "elapsed_time": "16:54:15", "remaining_time": "1:11:54", "throughput": 3350.8, "total_tokens": 203914768} +{"current_steps": 167695, "total_steps": 179580, "loss": 0.7218, "lr": 6.64274448131888e-07, "epoch": 18.676355941641607, "percentage": 93.38, "elapsed_time": "16:54:17", "remaining_time": "1:11:53", "throughput": 3350.81, "total_tokens": 203920944} +{"current_steps": 167700, "total_steps": 179580, "loss": 0.6823, "lr": 6.637181799630854e-07, "epoch": 18.676912796525226, "percentage": 93.38, "elapsed_time": "16:54:19", "remaining_time": "1:11:51", "throughput": 3350.81, "total_tokens": 203927120} +{"current_steps": 167705, "total_steps": 179580, "loss": 0.8918, "lr": 6.631621416699596e-07, "epoch": 18.677469651408842, "percentage": 93.39, "elapsed_time": "16:54:20", "remaining_time": "1:11:49", "throughput": 3350.81, "total_tokens": 203933392} +{"current_steps": 167710, "total_steps": 179580, "loss": 0.6303, "lr": 6.626063332577704e-07, "epoch": 18.67802650629246, "percentage": 93.39, "elapsed_time": "16:54:22", "remaining_time": "1:11:47", "throughput": 3350.82, "total_tokens": 203939664} +{"current_steps": 167715, "total_steps": 179580, "loss": 0.8569, "lr": 6.620507547317606e-07, "epoch": 18.678583361176077, "percentage": 93.39, "elapsed_time": "16:54:24", "remaining_time": "1:11:45", "throughput": 3350.82, "total_tokens": 203945680} +{"current_steps": 167720, "total_steps": 179580, "loss": 0.5832, "lr": 6.614954060971818e-07, "epoch": 18.679140216059693, "percentage": 93.4, "elapsed_time": "16:54:26", "remaining_time": "1:11:44", "throughput": 3350.82, "total_tokens": 203951856} +{"current_steps": 167725, "total_steps": 179580, "loss": 0.5967, "lr": 6.60940287359274e-07, "epoch": 18.679697070943313, "percentage": 93.4, "elapsed_time": "16:54:27", "remaining_time": "1:11:42", "throughput": 3350.83, "total_tokens": 203957968} +{"current_steps": 167730, "total_steps": 179580, "loss": 0.6025, "lr": 6.603853985232916e-07, "epoch": 18.68025392582693, "percentage": 93.4, "elapsed_time": "16:54:29", "remaining_time": "1:11:40", "throughput": 3350.83, "total_tokens": 203964112} +{"current_steps": 167735, "total_steps": 179580, "loss": 0.7099, "lr": 6.598307395944664e-07, "epoch": 18.680810780710548, "percentage": 93.4, "elapsed_time": "16:54:31", "remaining_time": "1:11:38", "throughput": 3350.83, "total_tokens": 203970320} +{"current_steps": 167740, "total_steps": 179580, "loss": 0.6421, "lr": 6.592763105780442e-07, "epoch": 18.681367635594164, "percentage": 93.41, "elapsed_time": "16:54:33", "remaining_time": "1:11:36", "throughput": 3350.84, "total_tokens": 203976752} +{"current_steps": 167745, "total_steps": 179580, "loss": 0.7354, "lr": 6.587221114792513e-07, "epoch": 18.681924490477783, "percentage": 93.41, "elapsed_time": "16:54:35", "remaining_time": "1:11:34", "throughput": 3350.84, "total_tokens": 203982960} +{"current_steps": 167750, "total_steps": 179580, "loss": 0.7081, "lr": 6.581681423033364e-07, "epoch": 18.6824813453614, "percentage": 93.41, "elapsed_time": "16:54:36", "remaining_time": "1:11:33", "throughput": 3350.85, "total_tokens": 203988944} +{"current_steps": 167755, "total_steps": 179580, "loss": 0.6501, "lr": 6.576144030555259e-07, "epoch": 18.683038200245015, "percentage": 93.42, "elapsed_time": "16:54:38", "remaining_time": "1:11:31", "throughput": 3350.85, "total_tokens": 203994768} +{"current_steps": 167760, "total_steps": 179580, "loss": 0.611, "lr": 6.570608937410488e-07, "epoch": 18.683595055128634, "percentage": 93.42, "elapsed_time": "16:54:40", "remaining_time": "1:11:29", "throughput": 3350.85, "total_tokens": 204001232} +{"current_steps": 167765, "total_steps": 179580, "loss": 0.8894, "lr": 6.565076143651316e-07, "epoch": 18.68415191001225, "percentage": 93.42, "elapsed_time": "16:54:42", "remaining_time": "1:11:27", "throughput": 3350.86, "total_tokens": 204007344} +{"current_steps": 167770, "total_steps": 179580, "loss": 0.9319, "lr": 6.559545649330062e-07, "epoch": 18.68470876489587, "percentage": 93.42, "elapsed_time": "16:54:43", "remaining_time": "1:11:25", "throughput": 3350.86, "total_tokens": 204012880} +{"current_steps": 167775, "total_steps": 179580, "loss": 0.5464, "lr": 6.554017454498934e-07, "epoch": 18.685265619779486, "percentage": 93.43, "elapsed_time": "16:54:45", "remaining_time": "1:11:24", "throughput": 3350.86, "total_tokens": 204018928} +{"current_steps": 167780, "total_steps": 179580, "loss": 0.7507, "lr": 6.548491559210168e-07, "epoch": 18.6858224746631, "percentage": 93.43, "elapsed_time": "16:54:47", "remaining_time": "1:11:22", "throughput": 3350.87, "total_tokens": 204024368} +{"current_steps": 167785, "total_steps": 179580, "loss": 0.6186, "lr": 6.542967963515944e-07, "epoch": 18.68637932954672, "percentage": 93.43, "elapsed_time": "16:54:48", "remaining_time": "1:11:20", "throughput": 3350.87, "total_tokens": 204030064} +{"current_steps": 167790, "total_steps": 179580, "loss": 0.6772, "lr": 6.537446667468472e-07, "epoch": 18.686936184430337, "percentage": 93.43, "elapsed_time": "16:54:50", "remaining_time": "1:11:18", "throughput": 3350.87, "total_tokens": 204036080} +{"current_steps": 167795, "total_steps": 179580, "loss": 0.7244, "lr": 6.53192767111982e-07, "epoch": 18.687493039313956, "percentage": 93.44, "elapsed_time": "16:54:52", "remaining_time": "1:11:16", "throughput": 3350.87, "total_tokens": 204041968} +{"current_steps": 167800, "total_steps": 179580, "loss": 0.6911, "lr": 6.526410974522196e-07, "epoch": 18.688049894197572, "percentage": 93.44, "elapsed_time": "16:54:53", "remaining_time": "1:11:14", "throughput": 3350.88, "total_tokens": 204047952} +{"current_steps": 167805, "total_steps": 179580, "loss": 0.6526, "lr": 6.520896577727698e-07, "epoch": 18.68860674908119, "percentage": 93.44, "elapsed_time": "16:54:55", "remaining_time": "1:11:13", "throughput": 3350.88, "total_tokens": 204054256} +{"current_steps": 167810, "total_steps": 179580, "loss": 1.077, "lr": 6.515384480788422e-07, "epoch": 18.689163603964808, "percentage": 93.45, "elapsed_time": "16:54:57", "remaining_time": "1:11:11", "throughput": 3350.88, "total_tokens": 204060368} +{"current_steps": 167815, "total_steps": 179580, "loss": 0.5744, "lr": 6.509874683756384e-07, "epoch": 18.689720458848424, "percentage": 93.45, "elapsed_time": "16:54:59", "remaining_time": "1:11:09", "throughput": 3350.89, "total_tokens": 204066576} +{"current_steps": 167820, "total_steps": 179580, "loss": 0.6299, "lr": 6.504367186683652e-07, "epoch": 18.690277313732043, "percentage": 93.45, "elapsed_time": "16:55:00", "remaining_time": "1:11:07", "throughput": 3350.89, "total_tokens": 204072624} +{"current_steps": 167825, "total_steps": 179580, "loss": 0.7882, "lr": 6.498861989622268e-07, "epoch": 18.69083416861566, "percentage": 93.45, "elapsed_time": "16:55:02", "remaining_time": "1:11:05", "throughput": 3350.9, "total_tokens": 204078608} +{"current_steps": 167830, "total_steps": 179580, "loss": 0.5742, "lr": 6.493359092624274e-07, "epoch": 18.691391023499275, "percentage": 93.46, "elapsed_time": "16:55:04", "remaining_time": "1:11:04", "throughput": 3350.9, "total_tokens": 204084688} +{"current_steps": 167835, "total_steps": 179580, "loss": 0.7499, "lr": 6.487858495741545e-07, "epoch": 18.691947878382894, "percentage": 93.46, "elapsed_time": "16:55:06", "remaining_time": "1:11:02", "throughput": 3350.9, "total_tokens": 204090896} +{"current_steps": 167840, "total_steps": 179580, "loss": 0.6102, "lr": 6.482360199026094e-07, "epoch": 18.69250473326651, "percentage": 93.46, "elapsed_time": "16:55:08", "remaining_time": "1:11:00", "throughput": 3350.91, "total_tokens": 204097200} +{"current_steps": 167845, "total_steps": 179580, "loss": 0.8169, "lr": 6.476864202529853e-07, "epoch": 18.69306158815013, "percentage": 93.47, "elapsed_time": "16:55:09", "remaining_time": "1:10:58", "throughput": 3350.91, "total_tokens": 204103280} +{"current_steps": 167850, "total_steps": 179580, "loss": 0.6919, "lr": 6.471370506304725e-07, "epoch": 18.693618443033746, "percentage": 93.47, "elapsed_time": "16:55:11", "remaining_time": "1:10:56", "throughput": 3350.91, "total_tokens": 204109488} +{"current_steps": 167855, "total_steps": 179580, "loss": 0.8303, "lr": 6.465879110402667e-07, "epoch": 18.69417529791736, "percentage": 93.47, "elapsed_time": "16:55:13", "remaining_time": "1:10:54", "throughput": 3350.91, "total_tokens": 204114800} +{"current_steps": 167860, "total_steps": 179580, "loss": 0.859, "lr": 6.460390014875445e-07, "epoch": 18.69473215280098, "percentage": 93.47, "elapsed_time": "16:55:14", "remaining_time": "1:10:53", "throughput": 3350.92, "total_tokens": 204120144} +{"current_steps": 167865, "total_steps": 179580, "loss": 0.5708, "lr": 6.454903219774988e-07, "epoch": 18.695289007684597, "percentage": 93.48, "elapsed_time": "16:55:16", "remaining_time": "1:10:51", "throughput": 3350.92, "total_tokens": 204126320} +{"current_steps": 167870, "total_steps": 179580, "loss": 0.656, "lr": 6.449418725153062e-07, "epoch": 18.695845862568216, "percentage": 93.48, "elapsed_time": "16:55:18", "remaining_time": "1:10:49", "throughput": 3350.92, "total_tokens": 204132240} +{"current_steps": 167875, "total_steps": 179580, "loss": 0.808, "lr": 6.44393653106154e-07, "epoch": 18.696402717451832, "percentage": 93.48, "elapsed_time": "16:55:20", "remaining_time": "1:10:47", "throughput": 3350.93, "total_tokens": 204138576} +{"current_steps": 167880, "total_steps": 179580, "loss": 0.8102, "lr": 6.43845663755216e-07, "epoch": 18.696959572335448, "percentage": 93.48, "elapsed_time": "16:55:21", "remaining_time": "1:10:45", "throughput": 3350.93, "total_tokens": 204144784} +{"current_steps": 167885, "total_steps": 179580, "loss": 0.4874, "lr": 6.432979044676712e-07, "epoch": 18.697516427219067, "percentage": 93.49, "elapsed_time": "16:55:23", "remaining_time": "1:10:43", "throughput": 3350.94, "total_tokens": 204150576} +{"current_steps": 167890, "total_steps": 179580, "loss": 0.6345, "lr": 6.42750375248688e-07, "epoch": 18.698073282102683, "percentage": 93.49, "elapsed_time": "16:55:25", "remaining_time": "1:10:42", "throughput": 3350.94, "total_tokens": 204156592} +{"current_steps": 167895, "total_steps": 179580, "loss": 0.7078, "lr": 6.422030761034453e-07, "epoch": 18.698630136986303, "percentage": 93.49, "elapsed_time": "16:55:26", "remaining_time": "1:10:40", "throughput": 3350.94, "total_tokens": 204162800} +{"current_steps": 167900, "total_steps": 179580, "loss": 0.7356, "lr": 6.416560070371114e-07, "epoch": 18.69918699186992, "percentage": 93.5, "elapsed_time": "16:55:28", "remaining_time": "1:10:38", "throughput": 3350.95, "total_tokens": 204169168} +{"current_steps": 167905, "total_steps": 179580, "loss": 0.6757, "lr": 6.411091680548487e-07, "epoch": 18.699743846753535, "percentage": 93.5, "elapsed_time": "16:55:30", "remaining_time": "1:10:36", "throughput": 3350.95, "total_tokens": 204175440} +{"current_steps": 167910, "total_steps": 179580, "loss": 1.0908, "lr": 6.405625591618253e-07, "epoch": 18.700300701637154, "percentage": 93.5, "elapsed_time": "16:55:32", "remaining_time": "1:10:34", "throughput": 3350.95, "total_tokens": 204181552} +{"current_steps": 167915, "total_steps": 179580, "loss": 0.8819, "lr": 6.400161803632065e-07, "epoch": 18.70085755652077, "percentage": 93.5, "elapsed_time": "16:55:34", "remaining_time": "1:10:33", "throughput": 3350.96, "total_tokens": 204187632} +{"current_steps": 167920, "total_steps": 179580, "loss": 0.7078, "lr": 6.394700316641522e-07, "epoch": 18.70141441140439, "percentage": 93.51, "elapsed_time": "16:55:35", "remaining_time": "1:10:31", "throughput": 3350.96, "total_tokens": 204193872} +{"current_steps": 167925, "total_steps": 179580, "loss": 0.5792, "lr": 6.389241130698193e-07, "epoch": 18.701971266288005, "percentage": 93.51, "elapsed_time": "16:55:37", "remaining_time": "1:10:29", "throughput": 3350.96, "total_tokens": 204199792} +{"current_steps": 167930, "total_steps": 179580, "loss": 0.7956, "lr": 6.383784245853674e-07, "epoch": 18.70252812117162, "percentage": 93.51, "elapsed_time": "16:55:39", "remaining_time": "1:10:27", "throughput": 3350.97, "total_tokens": 204205904} +{"current_steps": 167935, "total_steps": 179580, "loss": 0.9277, "lr": 6.37832966215951e-07, "epoch": 18.70308497605524, "percentage": 93.52, "elapsed_time": "16:55:41", "remaining_time": "1:10:25", "throughput": 3350.97, "total_tokens": 204211856} +{"current_steps": 167940, "total_steps": 179580, "loss": 0.5938, "lr": 6.372877379667159e-07, "epoch": 18.703641830938857, "percentage": 93.52, "elapsed_time": "16:55:42", "remaining_time": "1:10:23", "throughput": 3350.97, "total_tokens": 204218096} +{"current_steps": 167945, "total_steps": 179580, "loss": 0.836, "lr": 6.367427398428216e-07, "epoch": 18.704198685822476, "percentage": 93.52, "elapsed_time": "16:55:44", "remaining_time": "1:10:22", "throughput": 3350.98, "total_tokens": 204224400} +{"current_steps": 167950, "total_steps": 179580, "loss": 0.757, "lr": 6.361979718494115e-07, "epoch": 18.704755540706092, "percentage": 93.52, "elapsed_time": "16:55:46", "remaining_time": "1:10:20", "throughput": 3350.98, "total_tokens": 204230832} +{"current_steps": 167955, "total_steps": 179580, "loss": 0.7574, "lr": 6.356534339916315e-07, "epoch": 18.705312395589708, "percentage": 93.53, "elapsed_time": "16:55:48", "remaining_time": "1:10:18", "throughput": 3350.98, "total_tokens": 204236336} +{"current_steps": 167960, "total_steps": 179580, "loss": 0.7353, "lr": 6.351091262746217e-07, "epoch": 18.705869250473327, "percentage": 93.53, "elapsed_time": "16:55:49", "remaining_time": "1:10:16", "throughput": 3350.99, "total_tokens": 204242640} +{"current_steps": 167965, "total_steps": 179580, "loss": 0.9422, "lr": 6.345650487035309e-07, "epoch": 18.706426105356943, "percentage": 93.53, "elapsed_time": "16:55:51", "remaining_time": "1:10:14", "throughput": 3350.99, "total_tokens": 204248720} +{"current_steps": 167970, "total_steps": 179580, "loss": 0.8477, "lr": 6.340212012834912e-07, "epoch": 18.706982960240563, "percentage": 93.53, "elapsed_time": "16:55:53", "remaining_time": "1:10:13", "throughput": 3350.99, "total_tokens": 204254672} +{"current_steps": 167975, "total_steps": 179580, "loss": 0.9576, "lr": 6.334775840196483e-07, "epoch": 18.70753981512418, "percentage": 93.54, "elapsed_time": "16:55:55", "remaining_time": "1:10:11", "throughput": 3351.0, "total_tokens": 204260880} +{"current_steps": 167980, "total_steps": 179580, "loss": 0.6768, "lr": 6.32934196917126e-07, "epoch": 18.708096670007794, "percentage": 93.54, "elapsed_time": "16:55:57", "remaining_time": "1:10:09", "throughput": 3351.0, "total_tokens": 204267216} +{"current_steps": 167985, "total_steps": 179580, "loss": 0.788, "lr": 6.323910399810646e-07, "epoch": 18.708653524891414, "percentage": 93.54, "elapsed_time": "16:55:58", "remaining_time": "1:10:07", "throughput": 3351.0, "total_tokens": 204273424} +{"current_steps": 167990, "total_steps": 179580, "loss": 0.6397, "lr": 6.318481132165904e-07, "epoch": 18.70921037977503, "percentage": 93.55, "elapsed_time": "16:56:00", "remaining_time": "1:10:05", "throughput": 3351.01, "total_tokens": 204279728} +{"current_steps": 167995, "total_steps": 179580, "loss": 0.8489, "lr": 6.313054166288385e-07, "epoch": 18.70976723465865, "percentage": 93.55, "elapsed_time": "16:56:02", "remaining_time": "1:10:03", "throughput": 3351.01, "total_tokens": 204285904} +{"current_steps": 168000, "total_steps": 179580, "loss": 0.5957, "lr": 6.307629502229296e-07, "epoch": 18.710324089542265, "percentage": 93.55, "elapsed_time": "16:56:04", "remaining_time": "1:10:02", "throughput": 3351.02, "total_tokens": 204292176} +{"current_steps": 168005, "total_steps": 179580, "loss": 0.845, "lr": 6.3022071400399e-07, "epoch": 18.71088094442588, "percentage": 93.55, "elapsed_time": "16:56:06", "remaining_time": "1:10:00", "throughput": 3351.02, "total_tokens": 204298224} +{"current_steps": 168010, "total_steps": 179580, "loss": 0.6363, "lr": 6.296787079771382e-07, "epoch": 18.7114377993095, "percentage": 93.56, "elapsed_time": "16:56:07", "remaining_time": "1:09:58", "throughput": 3351.02, "total_tokens": 204304592} +{"current_steps": 168015, "total_steps": 179580, "loss": 0.5948, "lr": 6.291369321474977e-07, "epoch": 18.711994654193116, "percentage": 93.56, "elapsed_time": "16:56:09", "remaining_time": "1:09:56", "throughput": 3351.03, "total_tokens": 204310800} +{"current_steps": 168020, "total_steps": 179580, "loss": 0.8917, "lr": 6.285953865201838e-07, "epoch": 18.712551509076736, "percentage": 93.56, "elapsed_time": "16:56:11", "remaining_time": "1:09:54", "throughput": 3351.03, "total_tokens": 204317008} +{"current_steps": 168025, "total_steps": 179580, "loss": 0.7458, "lr": 6.280540711003119e-07, "epoch": 18.71310836396035, "percentage": 93.57, "elapsed_time": "16:56:13", "remaining_time": "1:09:53", "throughput": 3351.03, "total_tokens": 204323440} +{"current_steps": 168030, "total_steps": 179580, "loss": 0.6303, "lr": 6.275129858929946e-07, "epoch": 18.713665218843968, "percentage": 93.57, "elapsed_time": "16:56:14", "remaining_time": "1:09:51", "throughput": 3351.03, "total_tokens": 204329104} +{"current_steps": 168035, "total_steps": 179580, "loss": 0.6187, "lr": 6.269721309033472e-07, "epoch": 18.714222073727587, "percentage": 93.57, "elapsed_time": "16:56:16", "remaining_time": "1:09:49", "throughput": 3351.04, "total_tokens": 204335120} +{"current_steps": 168040, "total_steps": 179580, "loss": 0.7338, "lr": 6.264315061364739e-07, "epoch": 18.714778928611203, "percentage": 93.57, "elapsed_time": "16:56:18", "remaining_time": "1:09:47", "throughput": 3351.04, "total_tokens": 204340880} +{"current_steps": 168045, "total_steps": 179580, "loss": 0.554, "lr": 6.258911115974847e-07, "epoch": 18.715335783494822, "percentage": 93.58, "elapsed_time": "16:56:20", "remaining_time": "1:09:45", "throughput": 3351.04, "total_tokens": 204347024} +{"current_steps": 168050, "total_steps": 179580, "loss": 0.7756, "lr": 6.253509472914781e-07, "epoch": 18.71589263837844, "percentage": 93.58, "elapsed_time": "16:56:21", "remaining_time": "1:09:43", "throughput": 3351.05, "total_tokens": 204353040} +{"current_steps": 168055, "total_steps": 179580, "loss": 0.8443, "lr": 6.24811013223564e-07, "epoch": 18.716449493262054, "percentage": 93.58, "elapsed_time": "16:56:23", "remaining_time": "1:09:42", "throughput": 3351.05, "total_tokens": 204359056} +{"current_steps": 168060, "total_steps": 179580, "loss": 0.5887, "lr": 6.242713093988356e-07, "epoch": 18.717006348145674, "percentage": 93.59, "elapsed_time": "16:56:25", "remaining_time": "1:09:40", "throughput": 3351.05, "total_tokens": 204365360} +{"current_steps": 168065, "total_steps": 179580, "loss": 0.7715, "lr": 6.23731835822397e-07, "epoch": 18.71756320302929, "percentage": 93.59, "elapsed_time": "16:56:27", "remaining_time": "1:09:38", "throughput": 3351.06, "total_tokens": 204371056} +{"current_steps": 168070, "total_steps": 179580, "loss": 1.153, "lr": 6.231925924993415e-07, "epoch": 18.71812005791291, "percentage": 93.59, "elapsed_time": "16:56:28", "remaining_time": "1:09:36", "throughput": 3351.06, "total_tokens": 204377200} +{"current_steps": 168075, "total_steps": 179580, "loss": 0.6811, "lr": 6.226535794347622e-07, "epoch": 18.718676912796525, "percentage": 93.59, "elapsed_time": "16:56:30", "remaining_time": "1:09:34", "throughput": 3351.06, "total_tokens": 204383536} +{"current_steps": 168080, "total_steps": 179580, "loss": 0.5544, "lr": 6.221147966337492e-07, "epoch": 18.719233767680144, "percentage": 93.6, "elapsed_time": "16:56:32", "remaining_time": "1:09:33", "throughput": 3351.07, "total_tokens": 204389424} +{"current_steps": 168085, "total_steps": 179580, "loss": 0.809, "lr": 6.215762441013934e-07, "epoch": 18.71979062256376, "percentage": 93.6, "elapsed_time": "16:56:34", "remaining_time": "1:09:31", "throughput": 3351.07, "total_tokens": 204395504} +{"current_steps": 168090, "total_steps": 179580, "loss": 0.4591, "lr": 6.21037921842782e-07, "epoch": 18.720347477447376, "percentage": 93.6, "elapsed_time": "16:56:35", "remaining_time": "1:09:29", "throughput": 3351.07, "total_tokens": 204401520} +{"current_steps": 168095, "total_steps": 179580, "loss": 0.8338, "lr": 6.204998298629999e-07, "epoch": 18.720904332330996, "percentage": 93.6, "elapsed_time": "16:56:37", "remaining_time": "1:09:27", "throughput": 3351.08, "total_tokens": 204407696} +{"current_steps": 168100, "total_steps": 179580, "loss": 0.5985, "lr": 6.199619681671292e-07, "epoch": 18.72146118721461, "percentage": 93.61, "elapsed_time": "16:56:39", "remaining_time": "1:09:25", "throughput": 3351.08, "total_tokens": 204413968} +{"current_steps": 168105, "total_steps": 179580, "loss": 0.6137, "lr": 6.194243367602493e-07, "epoch": 18.722018042098227, "percentage": 93.61, "elapsed_time": "16:56:41", "remaining_time": "1:09:23", "throughput": 3351.09, "total_tokens": 204420144} +{"current_steps": 168110, "total_steps": 179580, "loss": 0.6141, "lr": 6.188869356474391e-07, "epoch": 18.722574896981847, "percentage": 93.61, "elapsed_time": "16:56:42", "remaining_time": "1:09:22", "throughput": 3351.09, "total_tokens": 204426128} +{"current_steps": 168115, "total_steps": 179580, "loss": 0.8119, "lr": 6.183497648337811e-07, "epoch": 18.723131751865463, "percentage": 93.62, "elapsed_time": "16:56:44", "remaining_time": "1:09:20", "throughput": 3351.09, "total_tokens": 204431920} +{"current_steps": 168120, "total_steps": 179580, "loss": 0.6739, "lr": 6.178128243243403e-07, "epoch": 18.723688606749082, "percentage": 93.62, "elapsed_time": "16:56:46", "remaining_time": "1:09:18", "throughput": 3351.1, "total_tokens": 204438096} +{"current_steps": 168125, "total_steps": 179580, "loss": 0.5419, "lr": 6.172761141241934e-07, "epoch": 18.724245461632698, "percentage": 93.62, "elapsed_time": "16:56:48", "remaining_time": "1:09:16", "throughput": 3351.1, "total_tokens": 204444144} +{"current_steps": 168130, "total_steps": 179580, "loss": 0.6025, "lr": 6.167396342384057e-07, "epoch": 18.724802316516318, "percentage": 93.62, "elapsed_time": "16:56:49", "remaining_time": "1:09:14", "throughput": 3351.1, "total_tokens": 204449008} +{"current_steps": 168135, "total_steps": 179580, "loss": 0.8528, "lr": 6.162033846720483e-07, "epoch": 18.725359171399933, "percentage": 93.63, "elapsed_time": "16:56:51", "remaining_time": "1:09:13", "throughput": 3351.1, "total_tokens": 204454768} +{"current_steps": 168140, "total_steps": 179580, "loss": 0.8224, "lr": 6.156673654301892e-07, "epoch": 18.72591602628355, "percentage": 93.63, "elapsed_time": "16:56:52", "remaining_time": "1:09:11", "throughput": 3351.11, "total_tokens": 204460240} +{"current_steps": 168145, "total_steps": 179580, "loss": 0.5824, "lr": 6.151315765178855e-07, "epoch": 18.72647288116717, "percentage": 93.63, "elapsed_time": "16:56:54", "remaining_time": "1:09:09", "throughput": 3351.11, "total_tokens": 204466512} +{"current_steps": 168150, "total_steps": 179580, "loss": 0.595, "lr": 6.145960179402e-07, "epoch": 18.727029736050785, "percentage": 93.64, "elapsed_time": "16:56:56", "remaining_time": "1:09:07", "throughput": 3351.11, "total_tokens": 204472464} +{"current_steps": 168155, "total_steps": 179580, "loss": 0.6318, "lr": 6.14060689702195e-07, "epoch": 18.727586590934404, "percentage": 93.64, "elapsed_time": "16:56:58", "remaining_time": "1:09:05", "throughput": 3351.11, "total_tokens": 204478544} +{"current_steps": 168160, "total_steps": 179580, "loss": 0.6982, "lr": 6.135255918089222e-07, "epoch": 18.72814344581802, "percentage": 93.64, "elapsed_time": "16:56:59", "remaining_time": "1:09:03", "throughput": 3351.12, "total_tokens": 204484336} +{"current_steps": 168165, "total_steps": 179580, "loss": 0.6996, "lr": 6.129907242654415e-07, "epoch": 18.728700300701636, "percentage": 93.64, "elapsed_time": "16:57:01", "remaining_time": "1:09:02", "throughput": 3351.12, "total_tokens": 204490640} +{"current_steps": 168170, "total_steps": 179580, "loss": 0.6151, "lr": 6.124560870767987e-07, "epoch": 18.729257155585255, "percentage": 93.65, "elapsed_time": "16:57:03", "remaining_time": "1:09:00", "throughput": 3351.12, "total_tokens": 204496528} +{"current_steps": 168175, "total_steps": 179580, "loss": 0.9456, "lr": 6.119216802480482e-07, "epoch": 18.72981401046887, "percentage": 93.65, "elapsed_time": "16:57:04", "remaining_time": "1:08:58", "throughput": 3351.13, "total_tokens": 204502448} +{"current_steps": 168180, "total_steps": 179580, "loss": 0.8692, "lr": 6.113875037842359e-07, "epoch": 18.73037086535249, "percentage": 93.65, "elapsed_time": "16:57:06", "remaining_time": "1:08:56", "throughput": 3351.13, "total_tokens": 204508592} +{"current_steps": 168185, "total_steps": 179580, "loss": 0.6428, "lr": 6.108535576904107e-07, "epoch": 18.730927720236107, "percentage": 93.65, "elapsed_time": "16:57:08", "remaining_time": "1:08:54", "throughput": 3351.13, "total_tokens": 204514672} +{"current_steps": 168190, "total_steps": 179580, "loss": 0.5973, "lr": 6.103198419716127e-07, "epoch": 18.731484575119723, "percentage": 93.66, "elapsed_time": "16:57:10", "remaining_time": "1:08:53", "throughput": 3351.14, "total_tokens": 204520464} +{"current_steps": 168195, "total_steps": 179580, "loss": 0.7885, "lr": 6.097863566328854e-07, "epoch": 18.732041430003342, "percentage": 93.66, "elapsed_time": "16:57:11", "remaining_time": "1:08:51", "throughput": 3351.14, "total_tokens": 204526512} +{"current_steps": 168200, "total_steps": 179580, "loss": 0.7061, "lr": 6.092531016792635e-07, "epoch": 18.732598284886958, "percentage": 93.66, "elapsed_time": "16:57:13", "remaining_time": "1:08:49", "throughput": 3351.14, "total_tokens": 204532656} +{"current_steps": 168205, "total_steps": 179580, "loss": 0.9688, "lr": 6.087200771157931e-07, "epoch": 18.733155139770577, "percentage": 93.67, "elapsed_time": "16:57:15", "remaining_time": "1:08:47", "throughput": 3351.15, "total_tokens": 204538864} +{"current_steps": 168210, "total_steps": 179580, "loss": 0.657, "lr": 6.081872829475005e-07, "epoch": 18.733711994654193, "percentage": 93.67, "elapsed_time": "16:57:17", "remaining_time": "1:08:45", "throughput": 3351.15, "total_tokens": 204544880} +{"current_steps": 168215, "total_steps": 179580, "loss": 0.5663, "lr": 6.076547191794207e-07, "epoch": 18.73426884953781, "percentage": 93.67, "elapsed_time": "16:57:19", "remaining_time": "1:08:43", "throughput": 3351.15, "total_tokens": 204551056} +{"current_steps": 168220, "total_steps": 179580, "loss": 0.6414, "lr": 6.071223858165859e-07, "epoch": 18.73482570442143, "percentage": 93.67, "elapsed_time": "16:57:20", "remaining_time": "1:08:42", "throughput": 3351.15, "total_tokens": 204556976} +{"current_steps": 168225, "total_steps": 179580, "loss": 0.9765, "lr": 6.065902828640225e-07, "epoch": 18.735382559305044, "percentage": 93.68, "elapsed_time": "16:57:22", "remaining_time": "1:08:40", "throughput": 3351.16, "total_tokens": 204563088} +{"current_steps": 168230, "total_steps": 179580, "loss": 0.8503, "lr": 6.06058410326757e-07, "epoch": 18.735939414188664, "percentage": 93.68, "elapsed_time": "16:57:24", "remaining_time": "1:08:38", "throughput": 3351.16, "total_tokens": 204569264} +{"current_steps": 168235, "total_steps": 179580, "loss": 0.7447, "lr": 6.055267682098187e-07, "epoch": 18.73649626907228, "percentage": 93.68, "elapsed_time": "16:57:26", "remaining_time": "1:08:36", "throughput": 3351.16, "total_tokens": 204575568} +{"current_steps": 168240, "total_steps": 179580, "loss": 0.6695, "lr": 6.049953565182231e-07, "epoch": 18.737053123955896, "percentage": 93.69, "elapsed_time": "16:57:27", "remaining_time": "1:08:34", "throughput": 3351.17, "total_tokens": 204581520} +{"current_steps": 168245, "total_steps": 179580, "loss": 0.8291, "lr": 6.044641752569857e-07, "epoch": 18.737609978839515, "percentage": 93.69, "elapsed_time": "16:57:29", "remaining_time": "1:08:33", "throughput": 3351.17, "total_tokens": 204587472} +{"current_steps": 168250, "total_steps": 179580, "loss": 0.6914, "lr": 6.039332244311357e-07, "epoch": 18.73816683372313, "percentage": 93.69, "elapsed_time": "16:57:31", "remaining_time": "1:08:31", "throughput": 3351.17, "total_tokens": 204593520} +{"current_steps": 168255, "total_steps": 179580, "loss": 0.5184, "lr": 6.034025040456775e-07, "epoch": 18.73872368860675, "percentage": 93.69, "elapsed_time": "16:57:33", "remaining_time": "1:08:29", "throughput": 3351.17, "total_tokens": 204599568} +{"current_steps": 168260, "total_steps": 179580, "loss": 0.7745, "lr": 6.028720141056349e-07, "epoch": 18.739280543490366, "percentage": 93.7, "elapsed_time": "16:57:34", "remaining_time": "1:08:27", "throughput": 3351.18, "total_tokens": 204605872} +{"current_steps": 168265, "total_steps": 179580, "loss": 0.6544, "lr": 6.023417546160065e-07, "epoch": 18.739837398373982, "percentage": 93.7, "elapsed_time": "16:57:36", "remaining_time": "1:08:25", "throughput": 3351.18, "total_tokens": 204612240} +{"current_steps": 168270, "total_steps": 179580, "loss": 0.6337, "lr": 6.018117255818106e-07, "epoch": 18.7403942532576, "percentage": 93.7, "elapsed_time": "16:57:38", "remaining_time": "1:08:23", "throughput": 3351.18, "total_tokens": 204618608} +{"current_steps": 168275, "total_steps": 179580, "loss": 0.4368, "lr": 6.012819270080461e-07, "epoch": 18.740951108141218, "percentage": 93.7, "elapsed_time": "16:57:40", "remaining_time": "1:08:22", "throughput": 3351.19, "total_tokens": 204624848} +{"current_steps": 168280, "total_steps": 179580, "loss": 0.7638, "lr": 6.007523588997282e-07, "epoch": 18.741507963024837, "percentage": 93.71, "elapsed_time": "16:57:42", "remaining_time": "1:08:20", "throughput": 3351.2, "total_tokens": 204631024} +{"current_steps": 168285, "total_steps": 179580, "loss": 1.1583, "lr": 6.002230212618503e-07, "epoch": 18.742064817908453, "percentage": 93.71, "elapsed_time": "16:57:43", "remaining_time": "1:08:18", "throughput": 3351.2, "total_tokens": 204637360} +{"current_steps": 168290, "total_steps": 179580, "loss": 0.7631, "lr": 5.99693914099414e-07, "epoch": 18.74262167279207, "percentage": 93.71, "elapsed_time": "16:57:45", "remaining_time": "1:08:16", "throughput": 3351.2, "total_tokens": 204643472} +{"current_steps": 168295, "total_steps": 179580, "loss": 0.6479, "lr": 5.991650374174151e-07, "epoch": 18.74317852767569, "percentage": 93.72, "elapsed_time": "16:57:47", "remaining_time": "1:08:14", "throughput": 3351.21, "total_tokens": 204649520} +{"current_steps": 168300, "total_steps": 179580, "loss": 0.6754, "lr": 5.986363912208582e-07, "epoch": 18.743735382559304, "percentage": 93.72, "elapsed_time": "16:57:49", "remaining_time": "1:08:13", "throughput": 3351.21, "total_tokens": 204655856} +{"current_steps": 168305, "total_steps": 179580, "loss": 0.7627, "lr": 5.981079755147279e-07, "epoch": 18.744292237442924, "percentage": 93.72, "elapsed_time": "16:57:50", "remaining_time": "1:08:11", "throughput": 3351.22, "total_tokens": 204662000} +{"current_steps": 168310, "total_steps": 179580, "loss": 0.7195, "lr": 5.975797903040176e-07, "epoch": 18.74484909232654, "percentage": 93.72, "elapsed_time": "16:57:52", "remaining_time": "1:08:09", "throughput": 3351.22, "total_tokens": 204668080} +{"current_steps": 168315, "total_steps": 179580, "loss": 0.6184, "lr": 5.970518355937149e-07, "epoch": 18.745405947210156, "percentage": 93.73, "elapsed_time": "16:57:54", "remaining_time": "1:08:07", "throughput": 3351.22, "total_tokens": 204673648} +{"current_steps": 168320, "total_steps": 179580, "loss": 0.8528, "lr": 5.965241113888131e-07, "epoch": 18.745962802093775, "percentage": 93.73, "elapsed_time": "16:57:56", "remaining_time": "1:08:05", "throughput": 3351.22, "total_tokens": 204679184} +{"current_steps": 168325, "total_steps": 179580, "loss": 0.7022, "lr": 5.959966176942889e-07, "epoch": 18.74651965697739, "percentage": 93.73, "elapsed_time": "16:57:57", "remaining_time": "1:08:03", "throughput": 3351.22, "total_tokens": 204685040} +{"current_steps": 168330, "total_steps": 179580, "loss": 0.7478, "lr": 5.954693545151296e-07, "epoch": 18.74707651186101, "percentage": 93.74, "elapsed_time": "16:57:59", "remaining_time": "1:08:02", "throughput": 3351.22, "total_tokens": 204691408} +{"current_steps": 168335, "total_steps": 179580, "loss": 0.6984, "lr": 5.949423218563177e-07, "epoch": 18.747633366744626, "percentage": 93.74, "elapsed_time": "16:58:01", "remaining_time": "1:08:00", "throughput": 3351.22, "total_tokens": 204697520} +{"current_steps": 168340, "total_steps": 179580, "loss": 0.9561, "lr": 5.944155197228268e-07, "epoch": 18.748190221628242, "percentage": 93.74, "elapsed_time": "16:58:03", "remaining_time": "1:07:58", "throughput": 3351.23, "total_tokens": 204704048} +{"current_steps": 168345, "total_steps": 179580, "loss": 0.8616, "lr": 5.938889481196335e-07, "epoch": 18.74874707651186, "percentage": 93.74, "elapsed_time": "16:58:05", "remaining_time": "1:07:56", "throughput": 3351.23, "total_tokens": 204710000} +{"current_steps": 168350, "total_steps": 179580, "loss": 0.8103, "lr": 5.933626070517145e-07, "epoch": 18.749303931395477, "percentage": 93.75, "elapsed_time": "16:58:06", "remaining_time": "1:07:54", "throughput": 3351.23, "total_tokens": 204716144} +{"current_steps": 168355, "total_steps": 179580, "loss": 0.7874, "lr": 5.928364965240408e-07, "epoch": 18.749860786279097, "percentage": 93.75, "elapsed_time": "16:58:08", "remaining_time": "1:07:53", "throughput": 3351.24, "total_tokens": 204722256} +{"current_steps": 168360, "total_steps": 179580, "loss": 1.1945, "lr": 5.923106165415831e-07, "epoch": 18.750417641162713, "percentage": 93.75, "elapsed_time": "16:58:10", "remaining_time": "1:07:51", "throughput": 3351.24, "total_tokens": 204728784} +{"current_steps": 168365, "total_steps": 179580, "loss": 0.8011, "lr": 5.917849671093018e-07, "epoch": 18.75097449604633, "percentage": 93.75, "elapsed_time": "16:58:12", "remaining_time": "1:07:49", "throughput": 3351.25, "total_tokens": 204734992} +{"current_steps": 168370, "total_steps": 179580, "loss": 1.0329, "lr": 5.912595482321676e-07, "epoch": 18.751531350929948, "percentage": 93.76, "elapsed_time": "16:58:14", "remaining_time": "1:07:47", "throughput": 3351.25, "total_tokens": 204741456} +{"current_steps": 168375, "total_steps": 179580, "loss": 0.6781, "lr": 5.907343599151432e-07, "epoch": 18.752088205813564, "percentage": 93.76, "elapsed_time": "16:58:15", "remaining_time": "1:07:45", "throughput": 3351.25, "total_tokens": 204747760} +{"current_steps": 168380, "total_steps": 179580, "loss": 0.643, "lr": 5.902094021631943e-07, "epoch": 18.752645060697184, "percentage": 93.76, "elapsed_time": "16:58:17", "remaining_time": "1:07:43", "throughput": 3351.26, "total_tokens": 204753968} +{"current_steps": 168385, "total_steps": 179580, "loss": 1.029, "lr": 5.896846749812667e-07, "epoch": 18.7532019155808, "percentage": 93.77, "elapsed_time": "16:58:19", "remaining_time": "1:07:42", "throughput": 3351.26, "total_tokens": 204760112} +{"current_steps": 168390, "total_steps": 179580, "loss": 0.9707, "lr": 5.891601783743289e-07, "epoch": 18.753758770464415, "percentage": 93.77, "elapsed_time": "16:58:21", "remaining_time": "1:07:40", "throughput": 3351.26, "total_tokens": 204765968} +{"current_steps": 168395, "total_steps": 179580, "loss": 0.5915, "lr": 5.886359123473295e-07, "epoch": 18.754315625348035, "percentage": 93.77, "elapsed_time": "16:58:22", "remaining_time": "1:07:38", "throughput": 3351.27, "total_tokens": 204772080} +{"current_steps": 168400, "total_steps": 179580, "loss": 0.728, "lr": 5.88111876905223e-07, "epoch": 18.75487248023165, "percentage": 93.77, "elapsed_time": "16:58:24", "remaining_time": "1:07:36", "throughput": 3351.27, "total_tokens": 204778128} +{"current_steps": 168405, "total_steps": 179580, "loss": 0.554, "lr": 5.875880720529581e-07, "epoch": 18.75542933511527, "percentage": 93.78, "elapsed_time": "16:58:26", "remaining_time": "1:07:34", "throughput": 3351.28, "total_tokens": 204784528} +{"current_steps": 168410, "total_steps": 179580, "loss": 0.8528, "lr": 5.870644977954837e-07, "epoch": 18.755986189998886, "percentage": 93.78, "elapsed_time": "16:58:28", "remaining_time": "1:07:33", "throughput": 3351.28, "total_tokens": 204790928} +{"current_steps": 168415, "total_steps": 179580, "loss": 0.6987, "lr": 5.86541154137743e-07, "epoch": 18.756543044882502, "percentage": 93.78, "elapsed_time": "16:58:30", "remaining_time": "1:07:31", "throughput": 3351.28, "total_tokens": 204797232} +{"current_steps": 168420, "total_steps": 179580, "loss": 0.8402, "lr": 5.860180410846794e-07, "epoch": 18.75709989976612, "percentage": 93.79, "elapsed_time": "16:58:31", "remaining_time": "1:07:29", "throughput": 3351.29, "total_tokens": 204803728} +{"current_steps": 168425, "total_steps": 179580, "loss": 0.73, "lr": 5.854951586412388e-07, "epoch": 18.757656754649737, "percentage": 93.79, "elapsed_time": "16:58:33", "remaining_time": "1:07:27", "throughput": 3351.29, "total_tokens": 204809872} +{"current_steps": 168430, "total_steps": 179580, "loss": 0.7998, "lr": 5.849725068123563e-07, "epoch": 18.758213609533357, "percentage": 93.79, "elapsed_time": "16:58:35", "remaining_time": "1:07:25", "throughput": 3351.29, "total_tokens": 204816176} +{"current_steps": 168435, "total_steps": 179580, "loss": 0.7712, "lr": 5.844500856029666e-07, "epoch": 18.758770464416973, "percentage": 93.79, "elapsed_time": "16:58:37", "remaining_time": "1:07:24", "throughput": 3351.3, "total_tokens": 204822384} +{"current_steps": 168440, "total_steps": 179580, "loss": 0.7497, "lr": 5.839278950180105e-07, "epoch": 18.75932731930059, "percentage": 93.8, "elapsed_time": "16:58:39", "remaining_time": "1:07:22", "throughput": 3351.3, "total_tokens": 204828272} +{"current_steps": 168445, "total_steps": 179580, "loss": 0.6606, "lr": 5.834059350624144e-07, "epoch": 18.759884174184208, "percentage": 93.8, "elapsed_time": "16:58:40", "remaining_time": "1:07:20", "throughput": 3351.3, "total_tokens": 204834032} +{"current_steps": 168450, "total_steps": 179580, "loss": 0.8281, "lr": 5.82884205741116e-07, "epoch": 18.760441029067824, "percentage": 93.8, "elapsed_time": "16:58:42", "remaining_time": "1:07:18", "throughput": 3351.3, "total_tokens": 204839920} +{"current_steps": 168455, "total_steps": 179580, "loss": 0.7956, "lr": 5.823627070590337e-07, "epoch": 18.760997883951443, "percentage": 93.8, "elapsed_time": "16:58:44", "remaining_time": "1:07:16", "throughput": 3351.31, "total_tokens": 204846160} +{"current_steps": 168460, "total_steps": 179580, "loss": 0.5516, "lr": 5.818414390211024e-07, "epoch": 18.76155473883506, "percentage": 93.81, "elapsed_time": "16:58:46", "remaining_time": "1:07:14", "throughput": 3351.31, "total_tokens": 204852304} +{"current_steps": 168465, "total_steps": 179580, "loss": 0.8856, "lr": 5.813204016322405e-07, "epoch": 18.76211159371868, "percentage": 93.81, "elapsed_time": "16:58:47", "remaining_time": "1:07:13", "throughput": 3351.31, "total_tokens": 204858480} +{"current_steps": 168470, "total_steps": 179580, "loss": 0.8023, "lr": 5.807995948973716e-07, "epoch": 18.762668448602295, "percentage": 93.81, "elapsed_time": "16:58:49", "remaining_time": "1:07:11", "throughput": 3351.32, "total_tokens": 204864240} +{"current_steps": 168475, "total_steps": 179580, "loss": 0.7386, "lr": 5.802790188214141e-07, "epoch": 18.76322530348591, "percentage": 93.82, "elapsed_time": "16:58:51", "remaining_time": "1:07:09", "throughput": 3351.32, "total_tokens": 204870384} +{"current_steps": 168480, "total_steps": 179580, "loss": 0.9487, "lr": 5.797586734092891e-07, "epoch": 18.76378215836953, "percentage": 93.82, "elapsed_time": "16:58:53", "remaining_time": "1:07:07", "throughput": 3351.32, "total_tokens": 204876560} +{"current_steps": 168485, "total_steps": 179580, "loss": 0.7319, "lr": 5.792385586659038e-07, "epoch": 18.764339013253146, "percentage": 93.82, "elapsed_time": "16:58:54", "remaining_time": "1:07:05", "throughput": 3351.33, "total_tokens": 204882672} +{"current_steps": 168490, "total_steps": 179580, "loss": 0.4798, "lr": 5.787186745961792e-07, "epoch": 18.764895868136765, "percentage": 93.82, "elapsed_time": "16:58:56", "remaining_time": "1:07:04", "throughput": 3351.33, "total_tokens": 204888592} +{"current_steps": 168495, "total_steps": 179580, "loss": 0.6349, "lr": 5.781990212050226e-07, "epoch": 18.76545272302038, "percentage": 93.83, "elapsed_time": "16:58:58", "remaining_time": "1:07:02", "throughput": 3351.33, "total_tokens": 204894256} +{"current_steps": 168500, "total_steps": 179580, "loss": 0.7514, "lr": 5.776795984973438e-07, "epoch": 18.766009577903997, "percentage": 93.83, "elapsed_time": "16:58:59", "remaining_time": "1:07:00", "throughput": 3351.34, "total_tokens": 204900464} +{"current_steps": 168505, "total_steps": 179580, "loss": 0.9552, "lr": 5.771604064780444e-07, "epoch": 18.766566432787616, "percentage": 93.83, "elapsed_time": "16:59:01", "remaining_time": "1:06:58", "throughput": 3351.34, "total_tokens": 204906512} +{"current_steps": 168510, "total_steps": 179580, "loss": 0.727, "lr": 5.766414451520347e-07, "epoch": 18.767123287671232, "percentage": 93.84, "elapsed_time": "16:59:03", "remaining_time": "1:06:56", "throughput": 3351.34, "total_tokens": 204912528} +{"current_steps": 168515, "total_steps": 179580, "loss": 0.7697, "lr": 5.761227145242132e-07, "epoch": 18.767680142554852, "percentage": 93.84, "elapsed_time": "16:59:05", "remaining_time": "1:06:54", "throughput": 3351.35, "total_tokens": 204918576} +{"current_steps": 168520, "total_steps": 179580, "loss": 0.9159, "lr": 5.756042145994816e-07, "epoch": 18.768236997438468, "percentage": 93.84, "elapsed_time": "16:59:06", "remaining_time": "1:06:53", "throughput": 3351.35, "total_tokens": 204924464} +{"current_steps": 168525, "total_steps": 179580, "loss": 0.8217, "lr": 5.750859453827362e-07, "epoch": 18.768793852322084, "percentage": 93.84, "elapsed_time": "16:59:08", "remaining_time": "1:06:51", "throughput": 3351.35, "total_tokens": 204930800} +{"current_steps": 168530, "total_steps": 179580, "loss": 0.7182, "lr": 5.745679068788728e-07, "epoch": 18.769350707205703, "percentage": 93.85, "elapsed_time": "16:59:10", "remaining_time": "1:06:49", "throughput": 3351.36, "total_tokens": 204936976} +{"current_steps": 168535, "total_steps": 179580, "loss": 0.4547, "lr": 5.740500990927849e-07, "epoch": 18.76990756208932, "percentage": 93.85, "elapsed_time": "16:59:12", "remaining_time": "1:06:47", "throughput": 3351.36, "total_tokens": 204943120} +{"current_steps": 168540, "total_steps": 179580, "loss": 0.7602, "lr": 5.73532522029363e-07, "epoch": 18.77046441697294, "percentage": 93.85, "elapsed_time": "16:59:14", "remaining_time": "1:06:45", "throughput": 3351.36, "total_tokens": 204949424} +{"current_steps": 168545, "total_steps": 179580, "loss": 0.5565, "lr": 5.730151756935003e-07, "epoch": 18.771021271856554, "percentage": 93.86, "elapsed_time": "16:59:15", "remaining_time": "1:06:43", "throughput": 3351.37, "total_tokens": 204955312} +{"current_steps": 168550, "total_steps": 179580, "loss": 0.9692, "lr": 5.724980600900764e-07, "epoch": 18.77157812674017, "percentage": 93.86, "elapsed_time": "16:59:17", "remaining_time": "1:06:42", "throughput": 3351.37, "total_tokens": 204961616} +{"current_steps": 168555, "total_steps": 179580, "loss": 0.5486, "lr": 5.71981175223979e-07, "epoch": 18.77213498162379, "percentage": 93.86, "elapsed_time": "16:59:19", "remaining_time": "1:06:40", "throughput": 3351.37, "total_tokens": 204967184} +{"current_steps": 168560, "total_steps": 179580, "loss": 0.5535, "lr": 5.714645211000902e-07, "epoch": 18.772691836507406, "percentage": 93.86, "elapsed_time": "16:59:20", "remaining_time": "1:06:38", "throughput": 3351.37, "total_tokens": 204972720} +{"current_steps": 168565, "total_steps": 179580, "loss": 0.9054, "lr": 5.709480977232922e-07, "epoch": 18.773248691391025, "percentage": 93.87, "elapsed_time": "16:59:22", "remaining_time": "1:06:36", "throughput": 3351.38, "total_tokens": 204978864} +{"current_steps": 168570, "total_steps": 179580, "loss": 0.6601, "lr": 5.704319050984647e-07, "epoch": 18.77380554627464, "percentage": 93.87, "elapsed_time": "16:59:24", "remaining_time": "1:06:34", "throughput": 3351.38, "total_tokens": 204985232} +{"current_steps": 168575, "total_steps": 179580, "loss": 0.7403, "lr": 5.699159432304757e-07, "epoch": 18.774362401158257, "percentage": 93.87, "elapsed_time": "16:59:26", "remaining_time": "1:06:33", "throughput": 3351.38, "total_tokens": 204991408} +{"current_steps": 168580, "total_steps": 179580, "loss": 0.8773, "lr": 5.694002121242048e-07, "epoch": 18.774919256041876, "percentage": 93.87, "elapsed_time": "16:59:28", "remaining_time": "1:06:31", "throughput": 3351.39, "total_tokens": 204997648} +{"current_steps": 168585, "total_steps": 179580, "loss": 0.5687, "lr": 5.688847117845231e-07, "epoch": 18.775476110925492, "percentage": 93.88, "elapsed_time": "16:59:29", "remaining_time": "1:06:29", "throughput": 3351.39, "total_tokens": 205003600} +{"current_steps": 168590, "total_steps": 179580, "loss": 0.7609, "lr": 5.683694422162988e-07, "epoch": 18.77603296580911, "percentage": 93.88, "elapsed_time": "16:59:31", "remaining_time": "1:06:27", "throughput": 3351.39, "total_tokens": 205009968} +{"current_steps": 168595, "total_steps": 179580, "loss": 0.7721, "lr": 5.678544034244004e-07, "epoch": 18.776589820692728, "percentage": 93.88, "elapsed_time": "16:59:33", "remaining_time": "1:06:25", "throughput": 3351.4, "total_tokens": 205016048} +{"current_steps": 168600, "total_steps": 179580, "loss": 0.7954, "lr": 5.673395954136934e-07, "epoch": 18.777146675576343, "percentage": 93.89, "elapsed_time": "16:59:34", "remaining_time": "1:06:23", "throughput": 3351.4, "total_tokens": 205021648} +{"current_steps": 168605, "total_steps": 179580, "loss": 0.7272, "lr": 5.66825018189035e-07, "epoch": 18.777703530459963, "percentage": 93.89, "elapsed_time": "16:59:36", "remaining_time": "1:06:22", "throughput": 3351.4, "total_tokens": 205027632} +{"current_steps": 168610, "total_steps": 179580, "loss": 0.7461, "lr": 5.663106717552907e-07, "epoch": 18.77826038534358, "percentage": 93.89, "elapsed_time": "16:59:38", "remaining_time": "1:06:20", "throughput": 3351.41, "total_tokens": 205034000} +{"current_steps": 168615, "total_steps": 179580, "loss": 0.7325, "lr": 5.657965561173207e-07, "epoch": 18.7788172402272, "percentage": 93.89, "elapsed_time": "16:59:40", "remaining_time": "1:06:18", "throughput": 3351.41, "total_tokens": 205040080} +{"current_steps": 168620, "total_steps": 179580, "loss": 0.9885, "lr": 5.652826712799764e-07, "epoch": 18.779374095110814, "percentage": 93.9, "elapsed_time": "16:59:42", "remaining_time": "1:06:16", "throughput": 3351.41, "total_tokens": 205046192} +{"current_steps": 168625, "total_steps": 179580, "loss": 0.8036, "lr": 5.647690172481124e-07, "epoch": 18.77993094999443, "percentage": 93.9, "elapsed_time": "16:59:43", "remaining_time": "1:06:14", "throughput": 3351.42, "total_tokens": 205052528} +{"current_steps": 168630, "total_steps": 179580, "loss": 0.7761, "lr": 5.642555940265859e-07, "epoch": 18.78048780487805, "percentage": 93.9, "elapsed_time": "16:59:45", "remaining_time": "1:06:13", "throughput": 3351.42, "total_tokens": 205058992} +{"current_steps": 168635, "total_steps": 179580, "loss": 0.6583, "lr": 5.637424016202403e-07, "epoch": 18.781044659761665, "percentage": 93.91, "elapsed_time": "16:59:47", "remaining_time": "1:06:11", "throughput": 3351.43, "total_tokens": 205065264} +{"current_steps": 168640, "total_steps": 179580, "loss": 0.9523, "lr": 5.632294400339299e-07, "epoch": 18.781601514645285, "percentage": 93.91, "elapsed_time": "16:59:49", "remaining_time": "1:06:09", "throughput": 3351.43, "total_tokens": 205071152} +{"current_steps": 168645, "total_steps": 179580, "loss": 0.7744, "lr": 5.627167092724899e-07, "epoch": 18.7821583695289, "percentage": 93.91, "elapsed_time": "16:59:50", "remaining_time": "1:06:07", "throughput": 3351.43, "total_tokens": 205077136} +{"current_steps": 168650, "total_steps": 179580, "loss": 0.6445, "lr": 5.622042093407748e-07, "epoch": 18.782715224412517, "percentage": 93.91, "elapsed_time": "16:59:52", "remaining_time": "1:06:05", "throughput": 3351.43, "total_tokens": 205083056} +{"current_steps": 168655, "total_steps": 179580, "loss": 0.7102, "lr": 5.616919402436166e-07, "epoch": 18.783272079296136, "percentage": 93.92, "elapsed_time": "16:59:54", "remaining_time": "1:06:04", "throughput": 3351.43, "total_tokens": 205089008} +{"current_steps": 168660, "total_steps": 179580, "loss": 0.6813, "lr": 5.611799019858587e-07, "epoch": 18.783828934179752, "percentage": 93.92, "elapsed_time": "16:59:56", "remaining_time": "1:06:02", "throughput": 3351.43, "total_tokens": 205095248} +{"current_steps": 168665, "total_steps": 179580, "loss": 0.702, "lr": 5.606680945723364e-07, "epoch": 18.78438578906337, "percentage": 93.92, "elapsed_time": "16:59:58", "remaining_time": "1:06:00", "throughput": 3351.43, "total_tokens": 205100944} +{"current_steps": 168670, "total_steps": 179580, "loss": 0.6771, "lr": 5.601565180078844e-07, "epoch": 18.784942643946987, "percentage": 93.92, "elapsed_time": "16:59:59", "remaining_time": "1:05:58", "throughput": 3351.44, "total_tokens": 205107344} +{"current_steps": 168675, "total_steps": 179580, "loss": 0.6221, "lr": 5.596451722973379e-07, "epoch": 18.785499498830603, "percentage": 93.93, "elapsed_time": "17:00:01", "remaining_time": "1:05:56", "throughput": 3351.44, "total_tokens": 205113296} +{"current_steps": 168680, "total_steps": 179580, "loss": 0.632, "lr": 5.591340574455178e-07, "epoch": 18.786056353714223, "percentage": 93.93, "elapsed_time": "17:00:03", "remaining_time": "1:05:54", "throughput": 3351.44, "total_tokens": 205119504} +{"current_steps": 168685, "total_steps": 179580, "loss": 0.8407, "lr": 5.586231734572622e-07, "epoch": 18.78661320859784, "percentage": 93.93, "elapsed_time": "17:00:05", "remaining_time": "1:05:53", "throughput": 3351.45, "total_tokens": 205125424} +{"current_steps": 168690, "total_steps": 179580, "loss": 0.633, "lr": 5.581125203373949e-07, "epoch": 18.787170063481458, "percentage": 93.94, "elapsed_time": "17:00:06", "remaining_time": "1:05:51", "throughput": 3351.45, "total_tokens": 205131472} +{"current_steps": 168695, "total_steps": 179580, "loss": 0.7412, "lr": 5.576020980907342e-07, "epoch": 18.787726918365074, "percentage": 93.94, "elapsed_time": "17:00:08", "remaining_time": "1:05:49", "throughput": 3351.45, "total_tokens": 205137520} +{"current_steps": 168700, "total_steps": 179580, "loss": 0.6626, "lr": 5.570919067221042e-07, "epoch": 18.78828377324869, "percentage": 93.94, "elapsed_time": "17:00:10", "remaining_time": "1:05:47", "throughput": 3351.45, "total_tokens": 205143696} +{"current_steps": 168705, "total_steps": 179580, "loss": 0.6789, "lr": 5.565819462363258e-07, "epoch": 18.78884062813231, "percentage": 93.94, "elapsed_time": "17:00:12", "remaining_time": "1:05:45", "throughput": 3351.46, "total_tokens": 205149648} +{"current_steps": 168710, "total_steps": 179580, "loss": 0.8795, "lr": 5.560722166382148e-07, "epoch": 18.789397483015925, "percentage": 93.95, "elapsed_time": "17:00:13", "remaining_time": "1:05:44", "throughput": 3351.46, "total_tokens": 205155216} +{"current_steps": 168715, "total_steps": 179580, "loss": 0.8599, "lr": 5.555627179325868e-07, "epoch": 18.789954337899545, "percentage": 93.95, "elapsed_time": "17:00:15", "remaining_time": "1:05:42", "throughput": 3351.46, "total_tokens": 205161392} +{"current_steps": 168720, "total_steps": 179580, "loss": 0.6193, "lr": 5.550534501242516e-07, "epoch": 18.79051119278316, "percentage": 93.95, "elapsed_time": "17:00:17", "remaining_time": "1:05:40", "throughput": 3351.47, "total_tokens": 205167184} +{"current_steps": 168725, "total_steps": 179580, "loss": 0.5488, "lr": 5.545444132180222e-07, "epoch": 18.791068047666776, "percentage": 93.96, "elapsed_time": "17:00:18", "remaining_time": "1:05:38", "throughput": 3351.47, "total_tokens": 205172912} +{"current_steps": 168730, "total_steps": 179580, "loss": 1.063, "lr": 5.540356072187031e-07, "epoch": 18.791624902550396, "percentage": 93.96, "elapsed_time": "17:00:20", "remaining_time": "1:05:36", "throughput": 3351.47, "total_tokens": 205178992} +{"current_steps": 168735, "total_steps": 179580, "loss": 0.7591, "lr": 5.53527032131107e-07, "epoch": 18.79218175743401, "percentage": 93.96, "elapsed_time": "17:00:22", "remaining_time": "1:05:34", "throughput": 3351.47, "total_tokens": 205185072} +{"current_steps": 168740, "total_steps": 179580, "loss": 0.607, "lr": 5.530186879600358e-07, "epoch": 18.79273861231763, "percentage": 93.96, "elapsed_time": "17:00:24", "remaining_time": "1:05:33", "throughput": 3351.48, "total_tokens": 205191568} +{"current_steps": 168745, "total_steps": 179580, "loss": 0.7702, "lr": 5.525105747102882e-07, "epoch": 18.793295467201247, "percentage": 93.97, "elapsed_time": "17:00:26", "remaining_time": "1:05:31", "throughput": 3351.48, "total_tokens": 205197904} +{"current_steps": 168750, "total_steps": 179580, "loss": 0.6477, "lr": 5.520026923866633e-07, "epoch": 18.793852322084863, "percentage": 93.97, "elapsed_time": "17:00:27", "remaining_time": "1:05:29", "throughput": 3351.49, "total_tokens": 205203792} +{"current_steps": 168755, "total_steps": 179580, "loss": 0.8909, "lr": 5.514950409939629e-07, "epoch": 18.794409176968482, "percentage": 93.97, "elapsed_time": "17:00:29", "remaining_time": "1:05:27", "throughput": 3351.49, "total_tokens": 205209968} +{"current_steps": 168760, "total_steps": 179580, "loss": 0.5798, "lr": 5.509876205369774e-07, "epoch": 18.7949660318521, "percentage": 93.97, "elapsed_time": "17:00:31", "remaining_time": "1:05:25", "throughput": 3351.49, "total_tokens": 205216368} +{"current_steps": 168765, "total_steps": 179580, "loss": 0.6716, "lr": 5.504804310205031e-07, "epoch": 18.795522886735718, "percentage": 93.98, "elapsed_time": "17:00:32", "remaining_time": "1:05:24", "throughput": 3351.5, "total_tokens": 205222096} +{"current_steps": 168770, "total_steps": 179580, "loss": 0.9941, "lr": 5.499734724493305e-07, "epoch": 18.796079741619334, "percentage": 93.98, "elapsed_time": "17:00:34", "remaining_time": "1:05:22", "throughput": 3351.5, "total_tokens": 205228272} +{"current_steps": 168775, "total_steps": 179580, "loss": 0.5784, "lr": 5.494667448282475e-07, "epoch": 18.79663659650295, "percentage": 93.98, "elapsed_time": "17:00:36", "remaining_time": "1:05:20", "throughput": 3351.5, "total_tokens": 205233360} +{"current_steps": 168780, "total_steps": 179580, "loss": 0.6012, "lr": 5.489602481620365e-07, "epoch": 18.79719345138657, "percentage": 93.99, "elapsed_time": "17:00:38", "remaining_time": "1:05:18", "throughput": 3351.51, "total_tokens": 205239568} +{"current_steps": 168785, "total_steps": 179580, "loss": 0.6259, "lr": 5.484539824554935e-07, "epoch": 18.797750306270185, "percentage": 93.99, "elapsed_time": "17:00:39", "remaining_time": "1:05:16", "throughput": 3351.51, "total_tokens": 205245904} +{"current_steps": 168790, "total_steps": 179580, "loss": 0.6728, "lr": 5.47947947713387e-07, "epoch": 18.798307161153804, "percentage": 93.99, "elapsed_time": "17:00:41", "remaining_time": "1:05:14", "throughput": 3351.51, "total_tokens": 205251888} +{"current_steps": 168795, "total_steps": 179580, "loss": 1.0807, "lr": 5.474421439405048e-07, "epoch": 18.79886401603742, "percentage": 93.99, "elapsed_time": "17:00:43", "remaining_time": "1:05:13", "throughput": 3351.52, "total_tokens": 205257904} +{"current_steps": 168800, "total_steps": 179580, "loss": 0.7387, "lr": 5.46936571141618e-07, "epoch": 18.79942087092104, "percentage": 94.0, "elapsed_time": "17:00:45", "remaining_time": "1:05:11", "throughput": 3351.52, "total_tokens": 205264048} +{"current_steps": 168805, "total_steps": 179580, "loss": 0.5642, "lr": 5.464312293215119e-07, "epoch": 18.799977725804656, "percentage": 94.0, "elapsed_time": "17:00:46", "remaining_time": "1:05:09", "throughput": 3351.53, "total_tokens": 205270224} +{"current_steps": 168810, "total_steps": 179580, "loss": 0.7948, "lr": 5.459261184849545e-07, "epoch": 18.80053458068827, "percentage": 94.0, "elapsed_time": "17:00:48", "remaining_time": "1:05:07", "throughput": 3351.53, "total_tokens": 205275792} +{"current_steps": 168815, "total_steps": 179580, "loss": 0.6121, "lr": 5.454212386367175e-07, "epoch": 18.80109143557189, "percentage": 94.01, "elapsed_time": "17:00:50", "remaining_time": "1:05:05", "throughput": 3351.53, "total_tokens": 205281776} +{"current_steps": 168820, "total_steps": 179580, "loss": 0.7629, "lr": 5.449165897815661e-07, "epoch": 18.801648290455507, "percentage": 94.01, "elapsed_time": "17:00:51", "remaining_time": "1:05:03", "throughput": 3351.53, "total_tokens": 205287856} +{"current_steps": 168825, "total_steps": 179580, "loss": 0.8132, "lr": 5.444121719242745e-07, "epoch": 18.802205145339123, "percentage": 94.01, "elapsed_time": "17:00:53", "remaining_time": "1:05:02", "throughput": 3351.53, "total_tokens": 205293328} +{"current_steps": 168830, "total_steps": 179580, "loss": 0.5077, "lr": 5.439079850696028e-07, "epoch": 18.802762000222742, "percentage": 94.01, "elapsed_time": "17:00:55", "remaining_time": "1:05:00", "throughput": 3351.54, "total_tokens": 205299408} +{"current_steps": 168835, "total_steps": 179580, "loss": 0.6256, "lr": 5.434040292223136e-07, "epoch": 18.803318855106358, "percentage": 94.02, "elapsed_time": "17:00:56", "remaining_time": "1:04:58", "throughput": 3351.54, "total_tokens": 205305264} +{"current_steps": 168840, "total_steps": 179580, "loss": 0.8314, "lr": 5.429003043871644e-07, "epoch": 18.803875709989978, "percentage": 94.02, "elapsed_time": "17:00:58", "remaining_time": "1:04:56", "throughput": 3351.54, "total_tokens": 205311632} +{"current_steps": 168845, "total_steps": 179580, "loss": 0.6264, "lr": 5.423968105689209e-07, "epoch": 18.804432564873593, "percentage": 94.02, "elapsed_time": "17:01:00", "remaining_time": "1:04:54", "throughput": 3351.55, "total_tokens": 205317808} +{"current_steps": 168850, "total_steps": 179580, "loss": 0.7417, "lr": 5.418935477723319e-07, "epoch": 18.804989419757213, "percentage": 94.02, "elapsed_time": "17:01:02", "remaining_time": "1:04:53", "throughput": 3351.55, "total_tokens": 205323792} +{"current_steps": 168855, "total_steps": 179580, "loss": 0.7825, "lr": 5.413905160021576e-07, "epoch": 18.80554627464083, "percentage": 94.03, "elapsed_time": "17:01:04", "remaining_time": "1:04:51", "throughput": 3351.55, "total_tokens": 205329648} +{"current_steps": 168860, "total_steps": 179580, "loss": 0.8009, "lr": 5.408877152631414e-07, "epoch": 18.806103129524445, "percentage": 94.03, "elapsed_time": "17:01:05", "remaining_time": "1:04:49", "throughput": 3351.56, "total_tokens": 205335184} +{"current_steps": 168865, "total_steps": 179580, "loss": 0.6877, "lr": 5.403851455600406e-07, "epoch": 18.806659984408064, "percentage": 94.03, "elapsed_time": "17:01:07", "remaining_time": "1:04:47", "throughput": 3351.56, "total_tokens": 205341520} +{"current_steps": 168870, "total_steps": 179580, "loss": 0.7397, "lr": 5.398828068975931e-07, "epoch": 18.80721683929168, "percentage": 94.04, "elapsed_time": "17:01:09", "remaining_time": "1:04:45", "throughput": 3351.56, "total_tokens": 205347760} +{"current_steps": 168875, "total_steps": 179580, "loss": 0.704, "lr": 5.393806992805561e-07, "epoch": 18.8077736941753, "percentage": 94.04, "elapsed_time": "17:01:10", "remaining_time": "1:04:43", "throughput": 3351.57, "total_tokens": 205353296} +{"current_steps": 168880, "total_steps": 179580, "loss": 0.7818, "lr": 5.388788227136621e-07, "epoch": 18.808330549058915, "percentage": 94.04, "elapsed_time": "17:01:12", "remaining_time": "1:04:42", "throughput": 3351.57, "total_tokens": 205359440} +{"current_steps": 168885, "total_steps": 179580, "loss": 0.5913, "lr": 5.383771772016599e-07, "epoch": 18.80888740394253, "percentage": 94.04, "elapsed_time": "17:01:14", "remaining_time": "1:04:40", "throughput": 3351.57, "total_tokens": 205365616} +{"current_steps": 168890, "total_steps": 179580, "loss": 0.6906, "lr": 5.378757627492764e-07, "epoch": 18.80944425882615, "percentage": 94.05, "elapsed_time": "17:01:15", "remaining_time": "1:04:38", "throughput": 3351.58, "total_tokens": 205371024} +{"current_steps": 168895, "total_steps": 179580, "loss": 0.8368, "lr": 5.373745793612605e-07, "epoch": 18.810001113709767, "percentage": 94.05, "elapsed_time": "17:01:17", "remaining_time": "1:04:36", "throughput": 3351.58, "total_tokens": 205376816} +{"current_steps": 168900, "total_steps": 179580, "loss": 0.7148, "lr": 5.368736270423391e-07, "epoch": 18.810557968593386, "percentage": 94.05, "elapsed_time": "17:01:19", "remaining_time": "1:04:34", "throughput": 3351.58, "total_tokens": 205383184} +{"current_steps": 168905, "total_steps": 179580, "loss": 0.6048, "lr": 5.363729057972472e-07, "epoch": 18.811114823477002, "percentage": 94.06, "elapsed_time": "17:01:21", "remaining_time": "1:04:33", "throughput": 3351.59, "total_tokens": 205389776} +{"current_steps": 168910, "total_steps": 179580, "loss": 0.7719, "lr": 5.358724156307116e-07, "epoch": 18.811671678360618, "percentage": 94.06, "elapsed_time": "17:01:23", "remaining_time": "1:04:31", "throughput": 3351.59, "total_tokens": 205395760} +{"current_steps": 168915, "total_steps": 179580, "loss": 0.6641, "lr": 5.353721565474617e-07, "epoch": 18.812228533244237, "percentage": 94.06, "elapsed_time": "17:01:24", "remaining_time": "1:04:29", "throughput": 3351.59, "total_tokens": 205401840} +{"current_steps": 168920, "total_steps": 179580, "loss": 0.6236, "lr": 5.348721285522218e-07, "epoch": 18.812785388127853, "percentage": 94.06, "elapsed_time": "17:01:26", "remaining_time": "1:04:27", "throughput": 3351.59, "total_tokens": 205407184} +{"current_steps": 168925, "total_steps": 179580, "loss": 0.6649, "lr": 5.343723316497184e-07, "epoch": 18.813342243011473, "percentage": 94.07, "elapsed_time": "17:01:28", "remaining_time": "1:04:25", "throughput": 3351.6, "total_tokens": 205413040} +{"current_steps": 168930, "total_steps": 179580, "loss": 0.6319, "lr": 5.338727658446674e-07, "epoch": 18.81389909789509, "percentage": 94.07, "elapsed_time": "17:01:29", "remaining_time": "1:04:23", "throughput": 3351.6, "total_tokens": 205419056} +{"current_steps": 168935, "total_steps": 179580, "loss": 0.7426, "lr": 5.333734311417926e-07, "epoch": 18.814455952778705, "percentage": 94.07, "elapsed_time": "17:01:31", "remaining_time": "1:04:22", "throughput": 3351.6, "total_tokens": 205424976} +{"current_steps": 168940, "total_steps": 179580, "loss": 0.6339, "lr": 5.328743275458043e-07, "epoch": 18.815012807662324, "percentage": 94.08, "elapsed_time": "17:01:33", "remaining_time": "1:04:20", "throughput": 3351.61, "total_tokens": 205430832} +{"current_steps": 168945, "total_steps": 179580, "loss": 0.7402, "lr": 5.323754550614235e-07, "epoch": 18.81556966254594, "percentage": 94.08, "elapsed_time": "17:01:35", "remaining_time": "1:04:18", "throughput": 3351.61, "total_tokens": 205437008} +{"current_steps": 168950, "total_steps": 179580, "loss": 0.5999, "lr": 5.318768136933578e-07, "epoch": 18.81612651742956, "percentage": 94.08, "elapsed_time": "17:01:36", "remaining_time": "1:04:16", "throughput": 3351.61, "total_tokens": 205443120} +{"current_steps": 168955, "total_steps": 179580, "loss": 0.9872, "lr": 5.313784034463226e-07, "epoch": 18.816683372313175, "percentage": 94.08, "elapsed_time": "17:01:38", "remaining_time": "1:04:14", "throughput": 3351.61, "total_tokens": 205449360} +{"current_steps": 168960, "total_steps": 179580, "loss": 0.5744, "lr": 5.308802243250171e-07, "epoch": 18.81724022719679, "percentage": 94.09, "elapsed_time": "17:01:40", "remaining_time": "1:04:13", "throughput": 3351.62, "total_tokens": 205455728} +{"current_steps": 168965, "total_steps": 179580, "loss": 0.9932, "lr": 5.30382276334157e-07, "epoch": 18.81779708208041, "percentage": 94.09, "elapsed_time": "17:01:42", "remaining_time": "1:04:11", "throughput": 3351.62, "total_tokens": 205461648} +{"current_steps": 168970, "total_steps": 179580, "loss": 0.668, "lr": 5.298845594784358e-07, "epoch": 18.818353936964026, "percentage": 94.09, "elapsed_time": "17:01:44", "remaining_time": "1:04:09", "throughput": 3351.63, "total_tokens": 205468240} +{"current_steps": 168975, "total_steps": 179580, "loss": 0.4263, "lr": 5.293870737625662e-07, "epoch": 18.818910791847646, "percentage": 94.09, "elapsed_time": "17:01:45", "remaining_time": "1:04:07", "throughput": 3351.63, "total_tokens": 205474512} +{"current_steps": 168980, "total_steps": 179580, "loss": 0.8204, "lr": 5.288898191912362e-07, "epoch": 18.819467646731262, "percentage": 94.1, "elapsed_time": "17:01:47", "remaining_time": "1:04:05", "throughput": 3351.63, "total_tokens": 205481040} +{"current_steps": 168985, "total_steps": 179580, "loss": 0.6735, "lr": 5.283927957691504e-07, "epoch": 18.820024501614878, "percentage": 94.1, "elapsed_time": "17:01:49", "remaining_time": "1:04:03", "throughput": 3351.64, "total_tokens": 205486992} +{"current_steps": 168990, "total_steps": 179580, "loss": 0.6356, "lr": 5.278960035009994e-07, "epoch": 18.820581356498497, "percentage": 94.1, "elapsed_time": "17:01:51", "remaining_time": "1:04:02", "throughput": 3351.64, "total_tokens": 205493200} +{"current_steps": 168995, "total_steps": 179580, "loss": 0.9919, "lr": 5.273994423914797e-07, "epoch": 18.821138211382113, "percentage": 94.11, "elapsed_time": "17:01:53", "remaining_time": "1:04:00", "throughput": 3351.64, "total_tokens": 205499376} +{"current_steps": 169000, "total_steps": 179580, "loss": 1.1286, "lr": 5.269031124452789e-07, "epoch": 18.821695066265733, "percentage": 94.11, "elapsed_time": "17:01:54", "remaining_time": "1:03:58", "throughput": 3351.65, "total_tokens": 205505680} +{"current_steps": 169005, "total_steps": 179580, "loss": 1.0183, "lr": 5.264070136670851e-07, "epoch": 18.82225192114935, "percentage": 94.11, "elapsed_time": "17:01:56", "remaining_time": "1:03:56", "throughput": 3351.65, "total_tokens": 205511824} +{"current_steps": 169010, "total_steps": 179580, "loss": 0.7758, "lr": 5.259111460615834e-07, "epoch": 18.822808776032964, "percentage": 94.11, "elapsed_time": "17:01:58", "remaining_time": "1:03:54", "throughput": 3351.66, "total_tokens": 205518160} +{"current_steps": 169015, "total_steps": 179580, "loss": 1.037, "lr": 5.254155096334618e-07, "epoch": 18.823365630916584, "percentage": 94.12, "elapsed_time": "17:02:00", "remaining_time": "1:03:53", "throughput": 3351.66, "total_tokens": 205524336} +{"current_steps": 169020, "total_steps": 179580, "loss": 0.8455, "lr": 5.249201043873996e-07, "epoch": 18.8239224858002, "percentage": 94.12, "elapsed_time": "17:02:01", "remaining_time": "1:03:51", "throughput": 3351.66, "total_tokens": 205530640} +{"current_steps": 169025, "total_steps": 179580, "loss": 0.9831, "lr": 5.244249303280741e-07, "epoch": 18.82447934068382, "percentage": 94.12, "elapsed_time": "17:02:03", "remaining_time": "1:03:49", "throughput": 3351.67, "total_tokens": 205536880} +{"current_steps": 169030, "total_steps": 179580, "loss": 0.8228, "lr": 5.239299874601644e-07, "epoch": 18.825036195567435, "percentage": 94.13, "elapsed_time": "17:02:05", "remaining_time": "1:03:47", "throughput": 3351.67, "total_tokens": 205542896} +{"current_steps": 169035, "total_steps": 179580, "loss": 0.6228, "lr": 5.234352757883476e-07, "epoch": 18.82559305045105, "percentage": 94.13, "elapsed_time": "17:02:07", "remaining_time": "1:03:45", "throughput": 3351.67, "total_tokens": 205548752} +{"current_steps": 169040, "total_steps": 179580, "loss": 0.8464, "lr": 5.229407953172922e-07, "epoch": 18.82614990533467, "percentage": 94.13, "elapsed_time": "17:02:08", "remaining_time": "1:03:43", "throughput": 3351.68, "total_tokens": 205554544} +{"current_steps": 169045, "total_steps": 179580, "loss": 0.6095, "lr": 5.224465460516775e-07, "epoch": 18.826706760218286, "percentage": 94.13, "elapsed_time": "17:02:10", "remaining_time": "1:03:42", "throughput": 3351.68, "total_tokens": 205560880} +{"current_steps": 169050, "total_steps": 179580, "loss": 0.6206, "lr": 5.219525279961585e-07, "epoch": 18.827263615101906, "percentage": 94.14, "elapsed_time": "17:02:12", "remaining_time": "1:03:40", "throughput": 3351.68, "total_tokens": 205566992} +{"current_steps": 169055, "total_steps": 179580, "loss": 0.5568, "lr": 5.214587411554145e-07, "epoch": 18.82782046998552, "percentage": 94.14, "elapsed_time": "17:02:14", "remaining_time": "1:03:38", "throughput": 3351.69, "total_tokens": 205573040} +{"current_steps": 169060, "total_steps": 179580, "loss": 0.5853, "lr": 5.20965185534103e-07, "epoch": 18.828377324869138, "percentage": 94.14, "elapsed_time": "17:02:15", "remaining_time": "1:03:36", "throughput": 3351.69, "total_tokens": 205578704} +{"current_steps": 169065, "total_steps": 179580, "loss": 0.6598, "lr": 5.204718611368869e-07, "epoch": 18.828934179752757, "percentage": 94.14, "elapsed_time": "17:02:17", "remaining_time": "1:03:34", "throughput": 3351.69, "total_tokens": 205584720} +{"current_steps": 169070, "total_steps": 179580, "loss": 0.72, "lr": 5.199787679684292e-07, "epoch": 18.829491034636373, "percentage": 94.15, "elapsed_time": "17:02:19", "remaining_time": "1:03:33", "throughput": 3351.7, "total_tokens": 205590928} +{"current_steps": 169075, "total_steps": 179580, "loss": 0.8396, "lr": 5.194859060333845e-07, "epoch": 18.830047889519992, "percentage": 94.15, "elapsed_time": "17:02:21", "remaining_time": "1:03:31", "throughput": 3351.7, "total_tokens": 205597360} +{"current_steps": 169080, "total_steps": 179580, "loss": 0.6165, "lr": 5.189932753364074e-07, "epoch": 18.830604744403608, "percentage": 94.15, "elapsed_time": "17:02:22", "remaining_time": "1:03:29", "throughput": 3351.7, "total_tokens": 205603440} +{"current_steps": 169085, "total_steps": 179580, "loss": 0.7421, "lr": 5.185008758821525e-07, "epoch": 18.831161599287224, "percentage": 94.16, "elapsed_time": "17:02:24", "remaining_time": "1:03:27", "throughput": 3351.71, "total_tokens": 205609168} +{"current_steps": 169090, "total_steps": 179580, "loss": 0.8253, "lr": 5.180087076752716e-07, "epoch": 18.831718454170844, "percentage": 94.16, "elapsed_time": "17:02:26", "remaining_time": "1:03:25", "throughput": 3351.71, "total_tokens": 205615248} +{"current_steps": 169095, "total_steps": 179580, "loss": 0.682, "lr": 5.175167707204137e-07, "epoch": 18.83227530905446, "percentage": 94.16, "elapsed_time": "17:02:28", "remaining_time": "1:03:23", "throughput": 3351.71, "total_tokens": 205621328} +{"current_steps": 169100, "total_steps": 179580, "loss": 0.7433, "lr": 5.170250650222253e-07, "epoch": 18.83283216393808, "percentage": 94.16, "elapsed_time": "17:02:29", "remaining_time": "1:03:22", "throughput": 3351.72, "total_tokens": 205627152} +{"current_steps": 169105, "total_steps": 179580, "loss": 0.7655, "lr": 5.165335905853497e-07, "epoch": 18.833389018821695, "percentage": 94.17, "elapsed_time": "17:02:31", "remaining_time": "1:03:20", "throughput": 3351.71, "total_tokens": 205632496} +{"current_steps": 169110, "total_steps": 179580, "loss": 0.5851, "lr": 5.160423474144305e-07, "epoch": 18.83394587370531, "percentage": 94.17, "elapsed_time": "17:02:33", "remaining_time": "1:03:18", "throughput": 3351.71, "total_tokens": 205638032} +{"current_steps": 169115, "total_steps": 179580, "loss": 0.9312, "lr": 5.155513355141056e-07, "epoch": 18.83450272858893, "percentage": 94.17, "elapsed_time": "17:02:35", "remaining_time": "1:03:16", "throughput": 3351.71, "total_tokens": 205644208} +{"current_steps": 169120, "total_steps": 179580, "loss": 0.9412, "lr": 5.150605548890186e-07, "epoch": 18.835059583472546, "percentage": 94.18, "elapsed_time": "17:02:36", "remaining_time": "1:03:14", "throughput": 3351.71, "total_tokens": 205649552} +{"current_steps": 169125, "total_steps": 179580, "loss": 0.7083, "lr": 5.145700055437991e-07, "epoch": 18.835616438356166, "percentage": 94.18, "elapsed_time": "17:02:38", "remaining_time": "1:03:13", "throughput": 3351.71, "total_tokens": 205655632} +{"current_steps": 169130, "total_steps": 179580, "loss": 0.5752, "lr": 5.14079687483085e-07, "epoch": 18.83617329323978, "percentage": 94.18, "elapsed_time": "17:02:40", "remaining_time": "1:03:11", "throughput": 3351.72, "total_tokens": 205661520} +{"current_steps": 169135, "total_steps": 179580, "loss": 0.5341, "lr": 5.135896007115032e-07, "epoch": 18.8367301481234, "percentage": 94.18, "elapsed_time": "17:02:41", "remaining_time": "1:03:09", "throughput": 3351.72, "total_tokens": 205668016} +{"current_steps": 169140, "total_steps": 179580, "loss": 0.8065, "lr": 5.130997452336889e-07, "epoch": 18.837287003007017, "percentage": 94.19, "elapsed_time": "17:02:43", "remaining_time": "1:03:07", "throughput": 3351.73, "total_tokens": 205674128} +{"current_steps": 169145, "total_steps": 179580, "loss": 0.7249, "lr": 5.126101210542661e-07, "epoch": 18.837843857890633, "percentage": 94.19, "elapsed_time": "17:02:45", "remaining_time": "1:03:05", "throughput": 3351.73, "total_tokens": 205680368} +{"current_steps": 169150, "total_steps": 179580, "loss": 0.7236, "lr": 5.12120728177859e-07, "epoch": 18.838400712774252, "percentage": 94.19, "elapsed_time": "17:02:47", "remaining_time": "1:03:03", "throughput": 3351.73, "total_tokens": 205686576} +{"current_steps": 169155, "total_steps": 179580, "loss": 0.5089, "lr": 5.116315666090887e-07, "epoch": 18.838957567657868, "percentage": 94.19, "elapsed_time": "17:02:49", "remaining_time": "1:03:02", "throughput": 3351.74, "total_tokens": 205693072} +{"current_steps": 169160, "total_steps": 179580, "loss": 0.6712, "lr": 5.111426363525795e-07, "epoch": 18.839514422541484, "percentage": 94.2, "elapsed_time": "17:02:50", "remaining_time": "1:03:00", "throughput": 3351.74, "total_tokens": 205699184} +{"current_steps": 169165, "total_steps": 179580, "loss": 0.6246, "lr": 5.106539374129499e-07, "epoch": 18.840071277425103, "percentage": 94.2, "elapsed_time": "17:02:52", "remaining_time": "1:02:58", "throughput": 3351.74, "total_tokens": 205705520} +{"current_steps": 169170, "total_steps": 179580, "loss": 0.8486, "lr": 5.101654697948127e-07, "epoch": 18.84062813230872, "percentage": 94.2, "elapsed_time": "17:02:54", "remaining_time": "1:02:56", "throughput": 3351.75, "total_tokens": 205711696} +{"current_steps": 169175, "total_steps": 179580, "loss": 0.8379, "lr": 5.09677233502781e-07, "epoch": 18.84118498719234, "percentage": 94.21, "elapsed_time": "17:02:56", "remaining_time": "1:02:54", "throughput": 3351.75, "total_tokens": 205717488} +{"current_steps": 169180, "total_steps": 179580, "loss": 0.6319, "lr": 5.091892285414735e-07, "epoch": 18.841741842075955, "percentage": 94.21, "elapsed_time": "17:02:57", "remaining_time": "1:02:53", "throughput": 3351.75, "total_tokens": 205723632} +{"current_steps": 169185, "total_steps": 179580, "loss": 0.8479, "lr": 5.087014549154917e-07, "epoch": 18.842298696959574, "percentage": 94.21, "elapsed_time": "17:02:59", "remaining_time": "1:02:51", "throughput": 3351.75, "total_tokens": 205729488} +{"current_steps": 169190, "total_steps": 179580, "loss": 0.7891, "lr": 5.082139126294516e-07, "epoch": 18.84285555184319, "percentage": 94.21, "elapsed_time": "17:03:01", "remaining_time": "1:02:49", "throughput": 3351.76, "total_tokens": 205735696} +{"current_steps": 169195, "total_steps": 179580, "loss": 0.6713, "lr": 5.077266016879495e-07, "epoch": 18.843412406726806, "percentage": 94.22, "elapsed_time": "17:03:03", "remaining_time": "1:02:47", "throughput": 3351.76, "total_tokens": 205741840} +{"current_steps": 169200, "total_steps": 179580, "loss": 0.8929, "lr": 5.072395220955956e-07, "epoch": 18.843969261610425, "percentage": 94.22, "elapsed_time": "17:03:04", "remaining_time": "1:02:45", "throughput": 3351.76, "total_tokens": 205747888} +{"current_steps": 169205, "total_steps": 179580, "loss": 0.7345, "lr": 5.067526738569834e-07, "epoch": 18.84452611649404, "percentage": 94.22, "elapsed_time": "17:03:06", "remaining_time": "1:02:43", "throughput": 3351.77, "total_tokens": 205753872} +{"current_steps": 169210, "total_steps": 179580, "loss": 0.7474, "lr": 5.062660569767203e-07, "epoch": 18.84508297137766, "percentage": 94.23, "elapsed_time": "17:03:08", "remaining_time": "1:02:42", "throughput": 3351.77, "total_tokens": 205760048} +{"current_steps": 169215, "total_steps": 179580, "loss": 0.6828, "lr": 5.05779671459397e-07, "epoch": 18.845639826261277, "percentage": 94.23, "elapsed_time": "17:03:10", "remaining_time": "1:02:40", "throughput": 3351.77, "total_tokens": 205766160} +{"current_steps": 169220, "total_steps": 179580, "loss": 0.8322, "lr": 5.052935173096102e-07, "epoch": 18.846196681144892, "percentage": 94.23, "elapsed_time": "17:03:11", "remaining_time": "1:02:38", "throughput": 3351.78, "total_tokens": 205772272} +{"current_steps": 169225, "total_steps": 179580, "loss": 0.5934, "lr": 5.048075945319475e-07, "epoch": 18.846753536028512, "percentage": 94.23, "elapsed_time": "17:03:13", "remaining_time": "1:02:36", "throughput": 3351.78, "total_tokens": 205777904} +{"current_steps": 169230, "total_steps": 179580, "loss": 0.7707, "lr": 5.043219031310053e-07, "epoch": 18.847310390912128, "percentage": 94.24, "elapsed_time": "17:03:15", "remaining_time": "1:02:34", "throughput": 3351.78, "total_tokens": 205784048} +{"current_steps": 169235, "total_steps": 179580, "loss": 0.6983, "lr": 5.038364431113662e-07, "epoch": 18.847867245795747, "percentage": 94.24, "elapsed_time": "17:03:17", "remaining_time": "1:02:33", "throughput": 3351.79, "total_tokens": 205789648} +{"current_steps": 169240, "total_steps": 179580, "loss": 0.6261, "lr": 5.033512144776209e-07, "epoch": 18.848424100679363, "percentage": 94.24, "elapsed_time": "17:03:18", "remaining_time": "1:02:31", "throughput": 3351.79, "total_tokens": 205795664} +{"current_steps": 169245, "total_steps": 179580, "loss": 0.5027, "lr": 5.028662172343462e-07, "epoch": 18.84898095556298, "percentage": 94.24, "elapsed_time": "17:03:20", "remaining_time": "1:02:29", "throughput": 3351.79, "total_tokens": 205801680} +{"current_steps": 169250, "total_steps": 179580, "loss": 0.7808, "lr": 5.023814513861302e-07, "epoch": 18.8495378104466, "percentage": 94.25, "elapsed_time": "17:03:22", "remaining_time": "1:02:27", "throughput": 3351.79, "total_tokens": 205807728} +{"current_steps": 169255, "total_steps": 179580, "loss": 0.9497, "lr": 5.018969169375443e-07, "epoch": 18.850094665330214, "percentage": 94.25, "elapsed_time": "17:03:24", "remaining_time": "1:02:25", "throughput": 3351.8, "total_tokens": 205813808} +{"current_steps": 169260, "total_steps": 179580, "loss": 0.8085, "lr": 5.014126138931763e-07, "epoch": 18.850651520213834, "percentage": 94.25, "elapsed_time": "17:03:25", "remaining_time": "1:02:23", "throughput": 3351.8, "total_tokens": 205819760} +{"current_steps": 169265, "total_steps": 179580, "loss": 0.7753, "lr": 5.009285422575866e-07, "epoch": 18.85120837509745, "percentage": 94.26, "elapsed_time": "17:03:27", "remaining_time": "1:02:22", "throughput": 3351.8, "total_tokens": 205826288} +{"current_steps": 169270, "total_steps": 179580, "loss": 0.665, "lr": 5.004447020353603e-07, "epoch": 18.851765229981066, "percentage": 94.26, "elapsed_time": "17:03:29", "remaining_time": "1:02:20", "throughput": 3351.81, "total_tokens": 205832688} +{"current_steps": 169275, "total_steps": 179580, "loss": 0.5228, "lr": 4.999610932310578e-07, "epoch": 18.852322084864685, "percentage": 94.26, "elapsed_time": "17:03:31", "remaining_time": "1:02:18", "throughput": 3351.81, "total_tokens": 205839152} +{"current_steps": 169280, "total_steps": 179580, "loss": 0.5938, "lr": 4.994777158492559e-07, "epoch": 18.8528789397483, "percentage": 94.26, "elapsed_time": "17:03:33", "remaining_time": "1:02:16", "throughput": 3351.82, "total_tokens": 205845584} +{"current_steps": 169285, "total_steps": 179580, "loss": 0.8931, "lr": 4.989945698945148e-07, "epoch": 18.85343579463192, "percentage": 94.27, "elapsed_time": "17:03:35", "remaining_time": "1:02:14", "throughput": 3351.82, "total_tokens": 205852144} +{"current_steps": 169290, "total_steps": 179580, "loss": 0.6441, "lr": 4.985116553714031e-07, "epoch": 18.853992649515536, "percentage": 94.27, "elapsed_time": "17:03:36", "remaining_time": "1:02:13", "throughput": 3351.83, "total_tokens": 205858320} +{"current_steps": 169295, "total_steps": 179580, "loss": 0.7327, "lr": 4.980289722844727e-07, "epoch": 18.854549504399152, "percentage": 94.27, "elapsed_time": "17:03:38", "remaining_time": "1:02:11", "throughput": 3351.83, "total_tokens": 205864624} +{"current_steps": 169300, "total_steps": 179580, "loss": 0.6911, "lr": 4.975465206382951e-07, "epoch": 18.85510635928277, "percentage": 94.28, "elapsed_time": "17:03:40", "remaining_time": "1:02:09", "throughput": 3351.83, "total_tokens": 205870576} +{"current_steps": 169305, "total_steps": 179580, "loss": 0.6953, "lr": 4.970643004374192e-07, "epoch": 18.855663214166388, "percentage": 94.28, "elapsed_time": "17:03:42", "remaining_time": "1:02:07", "throughput": 3351.84, "total_tokens": 205876688} +{"current_steps": 169310, "total_steps": 179580, "loss": 0.6928, "lr": 4.965823116864055e-07, "epoch": 18.856220069050007, "percentage": 94.28, "elapsed_time": "17:03:43", "remaining_time": "1:02:05", "throughput": 3351.84, "total_tokens": 205881648} +{"current_steps": 169315, "total_steps": 179580, "loss": 0.7375, "lr": 4.961005543897973e-07, "epoch": 18.856776923933623, "percentage": 94.28, "elapsed_time": "17:03:45", "remaining_time": "1:02:04", "throughput": 3351.84, "total_tokens": 205887536} +{"current_steps": 169320, "total_steps": 179580, "loss": 0.5961, "lr": 4.956190285521578e-07, "epoch": 18.85733377881724, "percentage": 94.29, "elapsed_time": "17:03:46", "remaining_time": "1:02:02", "throughput": 3351.84, "total_tokens": 205893456} +{"current_steps": 169325, "total_steps": 179580, "loss": 0.8871, "lr": 4.951377341780251e-07, "epoch": 18.85789063370086, "percentage": 94.29, "elapsed_time": "17:03:48", "remaining_time": "1:02:00", "throughput": 3351.84, "total_tokens": 205899344} +{"current_steps": 169330, "total_steps": 179580, "loss": 0.6311, "lr": 4.946566712719508e-07, "epoch": 18.858447488584474, "percentage": 94.29, "elapsed_time": "17:03:50", "remaining_time": "1:01:58", "throughput": 3351.85, "total_tokens": 205905360} +{"current_steps": 169335, "total_steps": 179580, "loss": 0.8004, "lr": 4.941758398384789e-07, "epoch": 18.859004343468094, "percentage": 94.3, "elapsed_time": "17:03:52", "remaining_time": "1:01:56", "throughput": 3351.85, "total_tokens": 205911504} +{"current_steps": 169340, "total_steps": 179580, "loss": 0.7614, "lr": 4.93695239882147e-07, "epoch": 18.85956119835171, "percentage": 94.3, "elapsed_time": "17:03:54", "remaining_time": "1:01:54", "throughput": 3351.85, "total_tokens": 205917712} +{"current_steps": 169345, "total_steps": 179580, "loss": 0.6432, "lr": 4.932148714074991e-07, "epoch": 18.860118053235325, "percentage": 94.3, "elapsed_time": "17:03:55", "remaining_time": "1:01:53", "throughput": 3351.85, "total_tokens": 205923664} +{"current_steps": 169350, "total_steps": 179580, "loss": 0.5725, "lr": 4.92734734419073e-07, "epoch": 18.860674908118945, "percentage": 94.3, "elapsed_time": "17:03:57", "remaining_time": "1:01:51", "throughput": 3351.86, "total_tokens": 205929936} +{"current_steps": 169355, "total_steps": 179580, "loss": 0.9338, "lr": 4.922548289214012e-07, "epoch": 18.86123176300256, "percentage": 94.31, "elapsed_time": "17:03:59", "remaining_time": "1:01:49", "throughput": 3351.86, "total_tokens": 205935536} +{"current_steps": 169360, "total_steps": 179580, "loss": 0.6618, "lr": 4.917751549190164e-07, "epoch": 18.86178861788618, "percentage": 94.31, "elapsed_time": "17:04:00", "remaining_time": "1:01:47", "throughput": 3351.87, "total_tokens": 205941840} +{"current_steps": 169365, "total_steps": 179580, "loss": 0.6706, "lr": 4.912957124164508e-07, "epoch": 18.862345472769796, "percentage": 94.31, "elapsed_time": "17:04:02", "remaining_time": "1:01:45", "throughput": 3351.87, "total_tokens": 205947760} +{"current_steps": 169370, "total_steps": 179580, "loss": 0.9087, "lr": 4.90816501418237e-07, "epoch": 18.862902327653412, "percentage": 94.31, "elapsed_time": "17:04:04", "remaining_time": "1:01:44", "throughput": 3351.87, "total_tokens": 205953968} +{"current_steps": 169375, "total_steps": 179580, "loss": 1.0241, "lr": 4.903375219288936e-07, "epoch": 18.86345918253703, "percentage": 94.32, "elapsed_time": "17:04:06", "remaining_time": "1:01:42", "throughput": 3351.87, "total_tokens": 205959632} +{"current_steps": 169380, "total_steps": 179580, "loss": 0.6301, "lr": 4.898587739529531e-07, "epoch": 18.864016037420647, "percentage": 94.32, "elapsed_time": "17:04:07", "remaining_time": "1:01:40", "throughput": 3351.88, "total_tokens": 205966064} +{"current_steps": 169385, "total_steps": 179580, "loss": 0.7376, "lr": 4.893802574949285e-07, "epoch": 18.864572892304267, "percentage": 94.32, "elapsed_time": "17:04:09", "remaining_time": "1:01:38", "throughput": 3351.88, "total_tokens": 205972016} +{"current_steps": 169390, "total_steps": 179580, "loss": 0.6926, "lr": 4.889019725593497e-07, "epoch": 18.865129747187883, "percentage": 94.33, "elapsed_time": "17:04:11", "remaining_time": "1:01:36", "throughput": 3351.89, "total_tokens": 205978096} +{"current_steps": 169395, "total_steps": 179580, "loss": 0.5421, "lr": 4.884239191507239e-07, "epoch": 18.8656866020715, "percentage": 94.33, "elapsed_time": "17:04:13", "remaining_time": "1:01:34", "throughput": 3351.89, "total_tokens": 205984368} +{"current_steps": 169400, "total_steps": 179580, "loss": 0.698, "lr": 4.879460972735784e-07, "epoch": 18.866243456955118, "percentage": 94.33, "elapsed_time": "17:04:14", "remaining_time": "1:01:33", "throughput": 3351.89, "total_tokens": 205990448} +{"current_steps": 169405, "total_steps": 179580, "loss": 0.7731, "lr": 4.874685069324203e-07, "epoch": 18.866800311838734, "percentage": 94.33, "elapsed_time": "17:04:16", "remaining_time": "1:01:31", "throughput": 3351.9, "total_tokens": 205996656} +{"current_steps": 169410, "total_steps": 179580, "loss": 0.6961, "lr": 4.869911481317601e-07, "epoch": 18.867357166722353, "percentage": 94.34, "elapsed_time": "17:04:18", "remaining_time": "1:01:29", "throughput": 3351.9, "total_tokens": 206002576} +{"current_steps": 169415, "total_steps": 179580, "loss": 0.8009, "lr": 4.865140208761054e-07, "epoch": 18.86791402160597, "percentage": 94.34, "elapsed_time": "17:04:20", "remaining_time": "1:01:27", "throughput": 3351.9, "total_tokens": 206008752} +{"current_steps": 169420, "total_steps": 179580, "loss": 0.6752, "lr": 4.860371251699691e-07, "epoch": 18.868470876489585, "percentage": 94.34, "elapsed_time": "17:04:22", "remaining_time": "1:01:25", "throughput": 3351.9, "total_tokens": 206014928} +{"current_steps": 169425, "total_steps": 179580, "loss": 0.8621, "lr": 4.855604610178505e-07, "epoch": 18.869027731373205, "percentage": 94.35, "elapsed_time": "17:04:23", "remaining_time": "1:01:24", "throughput": 3351.91, "total_tokens": 206021200} +{"current_steps": 169430, "total_steps": 179580, "loss": 0.7834, "lr": 4.850840284242541e-07, "epoch": 18.86958458625682, "percentage": 94.35, "elapsed_time": "17:04:25", "remaining_time": "1:01:22", "throughput": 3351.91, "total_tokens": 206027664} +{"current_steps": 169435, "total_steps": 179580, "loss": 0.7427, "lr": 4.846078273936794e-07, "epoch": 18.87014144114044, "percentage": 94.35, "elapsed_time": "17:04:27", "remaining_time": "1:01:20", "throughput": 3351.92, "total_tokens": 206034000} +{"current_steps": 169440, "total_steps": 179580, "loss": 0.8021, "lr": 4.841318579306281e-07, "epoch": 18.870698296024056, "percentage": 94.35, "elapsed_time": "17:04:29", "remaining_time": "1:01:18", "throughput": 3351.92, "total_tokens": 206040176} +{"current_steps": 169445, "total_steps": 179580, "loss": 0.7579, "lr": 4.836561200395912e-07, "epoch": 18.871255150907672, "percentage": 94.36, "elapsed_time": "17:04:31", "remaining_time": "1:01:16", "throughput": 3351.92, "total_tokens": 206046288} +{"current_steps": 169450, "total_steps": 179580, "loss": 0.7345, "lr": 4.831806137250649e-07, "epoch": 18.87181200579129, "percentage": 94.36, "elapsed_time": "17:04:32", "remaining_time": "1:01:14", "throughput": 3351.93, "total_tokens": 206052112} +{"current_steps": 169455, "total_steps": 179580, "loss": 0.8269, "lr": 4.827053389915404e-07, "epoch": 18.872368860674907, "percentage": 94.36, "elapsed_time": "17:04:34", "remaining_time": "1:01:13", "throughput": 3351.92, "total_tokens": 206058096} +{"current_steps": 169460, "total_steps": 179580, "loss": 0.6609, "lr": 4.822302958435054e-07, "epoch": 18.872925715558527, "percentage": 94.36, "elapsed_time": "17:04:36", "remaining_time": "1:01:11", "throughput": 3351.92, "total_tokens": 206064240} +{"current_steps": 169465, "total_steps": 179580, "loss": 0.5407, "lr": 4.817554842854483e-07, "epoch": 18.873482570442143, "percentage": 94.37, "elapsed_time": "17:04:38", "remaining_time": "1:01:09", "throughput": 3351.93, "total_tokens": 206070128} +{"current_steps": 169470, "total_steps": 179580, "loss": 0.6603, "lr": 4.812809043218569e-07, "epoch": 18.87403942532576, "percentage": 94.37, "elapsed_time": "17:04:39", "remaining_time": "1:01:07", "throughput": 3351.93, "total_tokens": 206076240} +{"current_steps": 169475, "total_steps": 179580, "loss": 0.6646, "lr": 4.808065559572112e-07, "epoch": 18.874596280209378, "percentage": 94.37, "elapsed_time": "17:04:41", "remaining_time": "1:01:05", "throughput": 3351.93, "total_tokens": 206082352} +{"current_steps": 169480, "total_steps": 179580, "loss": 0.6978, "lr": 4.803324391959907e-07, "epoch": 18.875153135092994, "percentage": 94.38, "elapsed_time": "17:04:43", "remaining_time": "1:01:04", "throughput": 3351.94, "total_tokens": 206088400} +{"current_steps": 169485, "total_steps": 179580, "loss": 0.7758, "lr": 4.798585540426781e-07, "epoch": 18.875709989976613, "percentage": 94.38, "elapsed_time": "17:04:44", "remaining_time": "1:01:02", "throughput": 3351.94, "total_tokens": 206093968} +{"current_steps": 169490, "total_steps": 179580, "loss": 0.6008, "lr": 4.79384900501742e-07, "epoch": 18.87626684486023, "percentage": 94.38, "elapsed_time": "17:04:46", "remaining_time": "1:01:00", "throughput": 3351.94, "total_tokens": 206100304} +{"current_steps": 169495, "total_steps": 179580, "loss": 0.6531, "lr": 4.789114785776649e-07, "epoch": 18.876823699743845, "percentage": 94.38, "elapsed_time": "17:04:48", "remaining_time": "1:00:58", "throughput": 3351.95, "total_tokens": 206106128} +{"current_steps": 169500, "total_steps": 179580, "loss": 0.6968, "lr": 4.784382882749127e-07, "epoch": 18.877380554627464, "percentage": 94.39, "elapsed_time": "17:04:50", "remaining_time": "1:00:56", "throughput": 3351.95, "total_tokens": 206112464} +{"current_steps": 169505, "total_steps": 179580, "loss": 0.775, "lr": 4.779653295979569e-07, "epoch": 18.87793740951108, "percentage": 94.39, "elapsed_time": "17:04:52", "remaining_time": "1:00:54", "throughput": 3351.95, "total_tokens": 206118320} +{"current_steps": 169510, "total_steps": 179580, "loss": 0.7655, "lr": 4.77492602551266e-07, "epoch": 18.8784942643947, "percentage": 94.39, "elapsed_time": "17:04:53", "remaining_time": "1:00:53", "throughput": 3351.95, "total_tokens": 206124208} +{"current_steps": 169515, "total_steps": 179580, "loss": 0.7659, "lr": 4.77020107139306e-07, "epoch": 18.879051119278316, "percentage": 94.4, "elapsed_time": "17:04:55", "remaining_time": "1:00:51", "throughput": 3351.96, "total_tokens": 206130384} +{"current_steps": 169520, "total_steps": 179580, "loss": 0.7171, "lr": 4.7654784336653437e-07, "epoch": 18.879607974161935, "percentage": 94.4, "elapsed_time": "17:04:57", "remaining_time": "1:00:49", "throughput": 3351.96, "total_tokens": 206136528} +{"current_steps": 169525, "total_steps": 179580, "loss": 0.7856, "lr": 4.760758112374225e-07, "epoch": 18.88016482904555, "percentage": 94.4, "elapsed_time": "17:04:59", "remaining_time": "1:00:47", "throughput": 3351.96, "total_tokens": 206142832} +{"current_steps": 169530, "total_steps": 179580, "loss": 0.6636, "lr": 4.756040107564169e-07, "epoch": 18.880721683929167, "percentage": 94.4, "elapsed_time": "17:05:00", "remaining_time": "1:00:45", "throughput": 3351.97, "total_tokens": 206148720} +{"current_steps": 169535, "total_steps": 179580, "loss": 0.859, "lr": 4.7513244192798347e-07, "epoch": 18.881278538812786, "percentage": 94.41, "elapsed_time": "17:05:02", "remaining_time": "1:00:44", "throughput": 3351.97, "total_tokens": 206154608} +{"current_steps": 169540, "total_steps": 179580, "loss": 0.7875, "lr": 4.7466110475657134e-07, "epoch": 18.881835393696402, "percentage": 94.41, "elapsed_time": "17:05:04", "remaining_time": "1:00:42", "throughput": 3351.97, "total_tokens": 206160688} +{"current_steps": 169545, "total_steps": 179580, "loss": 0.637, "lr": 4.7418999924663533e-07, "epoch": 18.88239224858002, "percentage": 94.41, "elapsed_time": "17:05:06", "remaining_time": "1:00:40", "throughput": 3351.98, "total_tokens": 206166896} +{"current_steps": 169550, "total_steps": 179580, "loss": 0.7024, "lr": 4.7371912540262466e-07, "epoch": 18.882949103463638, "percentage": 94.41, "elapsed_time": "17:05:07", "remaining_time": "1:00:38", "throughput": 3351.98, "total_tokens": 206173232} +{"current_steps": 169555, "total_steps": 179580, "loss": 0.7313, "lr": 4.732484832289885e-07, "epoch": 18.883505958347254, "percentage": 94.42, "elapsed_time": "17:05:09", "remaining_time": "1:00:36", "throughput": 3351.99, "total_tokens": 206179536} +{"current_steps": 169560, "total_steps": 179580, "loss": 0.6492, "lr": 4.7277807273016783e-07, "epoch": 18.884062813230873, "percentage": 94.42, "elapsed_time": "17:05:11", "remaining_time": "1:00:34", "throughput": 3351.99, "total_tokens": 206185744} +{"current_steps": 169565, "total_steps": 179580, "loss": 0.7197, "lr": 4.7230789391061183e-07, "epoch": 18.88461966811449, "percentage": 94.42, "elapsed_time": "17:05:13", "remaining_time": "1:00:33", "throughput": 3351.99, "total_tokens": 206192016} +{"current_steps": 169570, "total_steps": 179580, "loss": 0.8554, "lr": 4.7183794677475577e-07, "epoch": 18.88517652299811, "percentage": 94.43, "elapsed_time": "17:05:15", "remaining_time": "1:00:31", "throughput": 3352.0, "total_tokens": 206198448} +{"current_steps": 169575, "total_steps": 179580, "loss": 0.8347, "lr": 4.713682313270462e-07, "epoch": 18.885733377881724, "percentage": 94.43, "elapsed_time": "17:05:16", "remaining_time": "1:00:29", "throughput": 3352.0, "total_tokens": 206204304} +{"current_steps": 169580, "total_steps": 179580, "loss": 0.5047, "lr": 4.708987475719101e-07, "epoch": 18.88629023276534, "percentage": 94.43, "elapsed_time": "17:05:18", "remaining_time": "1:00:27", "throughput": 3352.0, "total_tokens": 206210672} +{"current_steps": 169585, "total_steps": 179580, "loss": 0.9715, "lr": 4.704294955137939e-07, "epoch": 18.88684708764896, "percentage": 94.43, "elapsed_time": "17:05:20", "remaining_time": "1:00:25", "throughput": 3352.0, "total_tokens": 206216912} +{"current_steps": 169590, "total_steps": 179580, "loss": 0.5056, "lr": 4.6996047515711904e-07, "epoch": 18.887403942532575, "percentage": 94.44, "elapsed_time": "17:05:22", "remaining_time": "1:00:24", "throughput": 3352.01, "total_tokens": 206223152} +{"current_steps": 169595, "total_steps": 179580, "loss": 0.6968, "lr": 4.694916865063237e-07, "epoch": 18.887960797416195, "percentage": 94.44, "elapsed_time": "17:05:24", "remaining_time": "1:00:22", "throughput": 3352.01, "total_tokens": 206229328} +{"current_steps": 169600, "total_steps": 179580, "loss": 0.6694, "lr": 4.6902312956583206e-07, "epoch": 18.88851765229981, "percentage": 94.44, "elapsed_time": "17:05:25", "remaining_time": "1:00:20", "throughput": 3352.02, "total_tokens": 206235632} +{"current_steps": 169605, "total_steps": 179580, "loss": 0.6598, "lr": 4.6855480434007113e-07, "epoch": 18.889074507183427, "percentage": 94.45, "elapsed_time": "17:05:27", "remaining_time": "1:00:18", "throughput": 3352.02, "total_tokens": 206242032} +{"current_steps": 169610, "total_steps": 179580, "loss": 0.6022, "lr": 4.6808671083346246e-07, "epoch": 18.889631362067046, "percentage": 94.45, "elapsed_time": "17:05:29", "remaining_time": "1:00:16", "throughput": 3352.02, "total_tokens": 206248336} +{"current_steps": 169615, "total_steps": 179580, "loss": 0.7044, "lr": 4.676188490504302e-07, "epoch": 18.890188216950662, "percentage": 94.45, "elapsed_time": "17:05:31", "remaining_time": "1:00:15", "throughput": 3352.03, "total_tokens": 206254224} +{"current_steps": 169620, "total_steps": 179580, "loss": 0.7059, "lr": 4.671512189953958e-07, "epoch": 18.89074507183428, "percentage": 94.45, "elapsed_time": "17:05:33", "remaining_time": "1:00:13", "throughput": 3352.03, "total_tokens": 206260656} +{"current_steps": 169625, "total_steps": 179580, "loss": 0.8329, "lr": 4.666838206727697e-07, "epoch": 18.891301926717897, "percentage": 94.46, "elapsed_time": "17:05:34", "remaining_time": "1:00:11", "throughput": 3352.03, "total_tokens": 206266832} +{"current_steps": 169630, "total_steps": 179580, "loss": 0.5372, "lr": 4.662166540869706e-07, "epoch": 18.891858781601513, "percentage": 94.46, "elapsed_time": "17:05:36", "remaining_time": "1:00:09", "throughput": 3352.04, "total_tokens": 206273200} +{"current_steps": 169635, "total_steps": 179580, "loss": 0.7962, "lr": 4.657497192424143e-07, "epoch": 18.892415636485133, "percentage": 94.46, "elapsed_time": "17:05:38", "remaining_time": "1:00:07", "throughput": 3352.04, "total_tokens": 206279184} +{"current_steps": 169640, "total_steps": 179580, "loss": 0.6951, "lr": 4.6528301614350843e-07, "epoch": 18.89297249136875, "percentage": 94.46, "elapsed_time": "17:05:40", "remaining_time": "1:00:05", "throughput": 3352.04, "total_tokens": 206285104} +{"current_steps": 169645, "total_steps": 179580, "loss": 0.5045, "lr": 4.6481654479466065e-07, "epoch": 18.893529346252368, "percentage": 94.47, "elapsed_time": "17:05:41", "remaining_time": "1:00:04", "throughput": 3352.05, "total_tokens": 206291120} +{"current_steps": 169650, "total_steps": 179580, "loss": 0.7672, "lr": 4.643503052002757e-07, "epoch": 18.894086201135984, "percentage": 94.47, "elapsed_time": "17:05:43", "remaining_time": "1:00:02", "throughput": 3352.05, "total_tokens": 206297168} +{"current_steps": 169655, "total_steps": 179580, "loss": 0.8069, "lr": 4.6388429736476115e-07, "epoch": 18.8946430560196, "percentage": 94.47, "elapsed_time": "17:05:45", "remaining_time": "1:00:00", "throughput": 3352.05, "total_tokens": 206303408} +{"current_steps": 169660, "total_steps": 179580, "loss": 0.8715, "lr": 4.634185212925163e-07, "epoch": 18.89519991090322, "percentage": 94.48, "elapsed_time": "17:05:47", "remaining_time": "0:59:58", "throughput": 3352.06, "total_tokens": 206309520} +{"current_steps": 169665, "total_steps": 179580, "loss": 0.5716, "lr": 4.6295297698794317e-07, "epoch": 18.895756765786835, "percentage": 94.48, "elapsed_time": "17:05:48", "remaining_time": "0:59:56", "throughput": 3352.06, "total_tokens": 206315888} +{"current_steps": 169670, "total_steps": 179580, "loss": 0.6256, "lr": 4.6248766445543824e-07, "epoch": 18.896313620670455, "percentage": 94.48, "elapsed_time": "17:05:50", "remaining_time": "0:59:55", "throughput": 3352.06, "total_tokens": 206322128} +{"current_steps": 169675, "total_steps": 179580, "loss": 0.7953, "lr": 4.6202258369939797e-07, "epoch": 18.89687047555407, "percentage": 94.48, "elapsed_time": "17:05:52", "remaining_time": "0:59:53", "throughput": 3352.07, "total_tokens": 206328208} +{"current_steps": 169680, "total_steps": 179580, "loss": 0.7567, "lr": 4.615577347242106e-07, "epoch": 18.897427330437687, "percentage": 94.49, "elapsed_time": "17:05:54", "remaining_time": "0:59:51", "throughput": 3352.07, "total_tokens": 206333968} +{"current_steps": 169685, "total_steps": 179580, "loss": 0.6022, "lr": 4.6109311753427253e-07, "epoch": 18.897984185321306, "percentage": 94.49, "elapsed_time": "17:05:56", "remaining_time": "0:59:49", "throughput": 3352.07, "total_tokens": 206340304} +{"current_steps": 169690, "total_steps": 179580, "loss": 0.5518, "lr": 4.606287321339692e-07, "epoch": 18.898541040204922, "percentage": 94.49, "elapsed_time": "17:05:57", "remaining_time": "0:59:47", "throughput": 3352.08, "total_tokens": 206346256} +{"current_steps": 169695, "total_steps": 179580, "loss": 0.7912, "lr": 4.6016457852768866e-07, "epoch": 18.89909789508854, "percentage": 94.5, "elapsed_time": "17:05:59", "remaining_time": "0:59:45", "throughput": 3352.08, "total_tokens": 206352400} +{"current_steps": 169700, "total_steps": 179580, "loss": 0.6748, "lr": 4.5970065671981365e-07, "epoch": 18.899654749972157, "percentage": 94.5, "elapsed_time": "17:06:01", "remaining_time": "0:59:44", "throughput": 3352.08, "total_tokens": 206358800} +{"current_steps": 169705, "total_steps": 179580, "loss": 0.748, "lr": 4.592369667147295e-07, "epoch": 18.900211604855773, "percentage": 94.5, "elapsed_time": "17:06:03", "remaining_time": "0:59:42", "throughput": 3352.09, "total_tokens": 206364912} +{"current_steps": 169710, "total_steps": 179580, "loss": 0.747, "lr": 4.587735085168104e-07, "epoch": 18.900768459739393, "percentage": 94.5, "elapsed_time": "17:06:04", "remaining_time": "0:59:40", "throughput": 3352.09, "total_tokens": 206370864} +{"current_steps": 169715, "total_steps": 179580, "loss": 0.9794, "lr": 4.583102821304419e-07, "epoch": 18.90132531462301, "percentage": 94.51, "elapsed_time": "17:06:06", "remaining_time": "0:59:38", "throughput": 3352.09, "total_tokens": 206376592} +{"current_steps": 169720, "total_steps": 179580, "loss": 0.7219, "lr": 4.5784728755998983e-07, "epoch": 18.901882169506628, "percentage": 94.51, "elapsed_time": "17:06:08", "remaining_time": "0:59:36", "throughput": 3352.09, "total_tokens": 206382640} +{"current_steps": 169725, "total_steps": 179580, "loss": 0.6625, "lr": 4.5738452480983685e-07, "epoch": 18.902439024390244, "percentage": 94.51, "elapsed_time": "17:06:10", "remaining_time": "0:59:35", "throughput": 3352.1, "total_tokens": 206388752} +{"current_steps": 169730, "total_steps": 179580, "loss": 0.6033, "lr": 4.5692199388434885e-07, "epoch": 18.90299587927386, "percentage": 94.51, "elapsed_time": "17:06:11", "remaining_time": "0:59:33", "throughput": 3352.1, "total_tokens": 206394608} +{"current_steps": 169735, "total_steps": 179580, "loss": 0.7217, "lr": 4.564596947878974e-07, "epoch": 18.90355273415748, "percentage": 94.52, "elapsed_time": "17:06:13", "remaining_time": "0:59:31", "throughput": 3352.1, "total_tokens": 206400944} +{"current_steps": 169740, "total_steps": 179580, "loss": 0.7952, "lr": 4.5599762752484843e-07, "epoch": 18.904109589041095, "percentage": 94.52, "elapsed_time": "17:06:15", "remaining_time": "0:59:29", "throughput": 3352.1, "total_tokens": 206407120} +{"current_steps": 169745, "total_steps": 179580, "loss": 0.6598, "lr": 4.555357920995651e-07, "epoch": 18.904666443924715, "percentage": 94.52, "elapsed_time": "17:06:17", "remaining_time": "0:59:27", "throughput": 3352.11, "total_tokens": 206413264} +{"current_steps": 169750, "total_steps": 179580, "loss": 0.6677, "lr": 4.550741885164106e-07, "epoch": 18.90522329880833, "percentage": 94.53, "elapsed_time": "17:06:18", "remaining_time": "0:59:25", "throughput": 3352.11, "total_tokens": 206419504} +{"current_steps": 169755, "total_steps": 179580, "loss": 0.818, "lr": 4.546128167797453e-07, "epoch": 18.905780153691946, "percentage": 94.53, "elapsed_time": "17:06:20", "remaining_time": "0:59:24", "throughput": 3352.11, "total_tokens": 206425616} +{"current_steps": 169760, "total_steps": 179580, "loss": 0.7145, "lr": 4.541516768939297e-07, "epoch": 18.906337008575566, "percentage": 94.53, "elapsed_time": "17:06:22", "remaining_time": "0:59:22", "throughput": 3352.12, "total_tokens": 206431024} +{"current_steps": 169765, "total_steps": 179580, "loss": 0.6935, "lr": 4.5369076886331574e-07, "epoch": 18.90689386345918, "percentage": 94.53, "elapsed_time": "17:06:24", "remaining_time": "0:59:20", "throughput": 3352.12, "total_tokens": 206436976} +{"current_steps": 169770, "total_steps": 179580, "loss": 0.8493, "lr": 4.532300926922584e-07, "epoch": 18.9074507183428, "percentage": 94.54, "elapsed_time": "17:06:25", "remaining_time": "0:59:18", "throughput": 3352.12, "total_tokens": 206442448} +{"current_steps": 169775, "total_steps": 179580, "loss": 0.6003, "lr": 4.527696483851096e-07, "epoch": 18.908007573226417, "percentage": 94.54, "elapsed_time": "17:06:27", "remaining_time": "0:59:16", "throughput": 3352.12, "total_tokens": 206448400} +{"current_steps": 169780, "total_steps": 179580, "loss": 0.7992, "lr": 4.5230943594621597e-07, "epoch": 18.908564428110033, "percentage": 94.54, "elapsed_time": "17:06:29", "remaining_time": "0:59:15", "throughput": 3352.12, "total_tokens": 206454128} +{"current_steps": 169785, "total_steps": 179580, "loss": 0.7362, "lr": 4.518494553799324e-07, "epoch": 18.909121282993652, "percentage": 94.55, "elapsed_time": "17:06:30", "remaining_time": "0:59:13", "throughput": 3352.13, "total_tokens": 206460144} +{"current_steps": 169790, "total_steps": 179580, "loss": 0.5203, "lr": 4.5138970669059423e-07, "epoch": 18.90967813787727, "percentage": 94.55, "elapsed_time": "17:06:32", "remaining_time": "0:59:11", "throughput": 3352.13, "total_tokens": 206466320} +{"current_steps": 169795, "total_steps": 179580, "loss": 0.6469, "lr": 4.5093018988255076e-07, "epoch": 18.910234992760888, "percentage": 94.55, "elapsed_time": "17:06:34", "remaining_time": "0:59:09", "throughput": 3352.14, "total_tokens": 206472432} +{"current_steps": 169800, "total_steps": 179580, "loss": 0.6333, "lr": 4.5047090496013745e-07, "epoch": 18.910791847644504, "percentage": 94.55, "elapsed_time": "17:06:36", "remaining_time": "0:59:07", "throughput": 3352.14, "total_tokens": 206478704} +{"current_steps": 169805, "total_steps": 179580, "loss": 0.7144, "lr": 4.5001185192769524e-07, "epoch": 18.91134870252812, "percentage": 94.56, "elapsed_time": "17:06:37", "remaining_time": "0:59:05", "throughput": 3352.14, "total_tokens": 206484592} +{"current_steps": 169810, "total_steps": 179580, "loss": 0.7204, "lr": 4.495530307895623e-07, "epoch": 18.91190555741174, "percentage": 94.56, "elapsed_time": "17:06:39", "remaining_time": "0:59:04", "throughput": 3352.14, "total_tokens": 206490896} +{"current_steps": 169815, "total_steps": 179580, "loss": 0.7654, "lr": 4.490944415500714e-07, "epoch": 18.912462412295355, "percentage": 94.56, "elapsed_time": "17:06:41", "remaining_time": "0:59:02", "throughput": 3352.15, "total_tokens": 206497136} +{"current_steps": 169820, "total_steps": 179580, "loss": 0.651, "lr": 4.486360842135495e-07, "epoch": 18.913019267178974, "percentage": 94.57, "elapsed_time": "17:06:43", "remaining_time": "0:59:00", "throughput": 3352.15, "total_tokens": 206503344} +{"current_steps": 169825, "total_steps": 179580, "loss": 0.983, "lr": 4.481779587843321e-07, "epoch": 18.91357612206259, "percentage": 94.57, "elapsed_time": "17:06:45", "remaining_time": "0:58:58", "throughput": 3352.15, "total_tokens": 206509520} +{"current_steps": 169830, "total_steps": 179580, "loss": 0.9202, "lr": 4.4772006526674625e-07, "epoch": 18.914132976946206, "percentage": 94.57, "elapsed_time": "17:06:46", "remaining_time": "0:58:56", "throughput": 3352.16, "total_tokens": 206515920} +{"current_steps": 169835, "total_steps": 179580, "loss": 0.7398, "lr": 4.4726240366511354e-07, "epoch": 18.914689831829826, "percentage": 94.57, "elapsed_time": "17:06:48", "remaining_time": "0:58:55", "throughput": 3352.16, "total_tokens": 206522160} +{"current_steps": 169840, "total_steps": 179580, "loss": 0.8222, "lr": 4.468049739837582e-07, "epoch": 18.91524668671344, "percentage": 94.58, "elapsed_time": "17:06:50", "remaining_time": "0:58:53", "throughput": 3352.16, "total_tokens": 206527792} +{"current_steps": 169845, "total_steps": 179580, "loss": 0.6145, "lr": 4.4634777622700187e-07, "epoch": 18.91580354159706, "percentage": 94.58, "elapsed_time": "17:06:52", "remaining_time": "0:58:51", "throughput": 3352.17, "total_tokens": 206533840} +{"current_steps": 169850, "total_steps": 179580, "loss": 0.852, "lr": 4.4589081039916047e-07, "epoch": 18.916360396480677, "percentage": 94.58, "elapsed_time": "17:06:53", "remaining_time": "0:58:49", "throughput": 3352.17, "total_tokens": 206539792} +{"current_steps": 169855, "total_steps": 179580, "loss": 0.628, "lr": 4.4543407650455836e-07, "epoch": 18.916917251364296, "percentage": 94.58, "elapsed_time": "17:06:55", "remaining_time": "0:58:47", "throughput": 3352.17, "total_tokens": 206546096} +{"current_steps": 169860, "total_steps": 179580, "loss": 0.9586, "lr": 4.4497757454750044e-07, "epoch": 18.917474106247912, "percentage": 94.59, "elapsed_time": "17:06:57", "remaining_time": "0:58:45", "throughput": 3352.18, "total_tokens": 206551792} +{"current_steps": 169865, "total_steps": 179580, "loss": 0.6313, "lr": 4.445213045323027e-07, "epoch": 18.918030961131528, "percentage": 94.59, "elapsed_time": "17:06:59", "remaining_time": "0:58:44", "throughput": 3352.18, "total_tokens": 206558384} +{"current_steps": 169870, "total_steps": 179580, "loss": 0.7528, "lr": 4.440652664632755e-07, "epoch": 18.918587816015147, "percentage": 94.59, "elapsed_time": "17:07:00", "remaining_time": "0:58:42", "throughput": 3352.18, "total_tokens": 206564496} +{"current_steps": 169875, "total_steps": 179580, "loss": 0.6299, "lr": 4.436094603447266e-07, "epoch": 18.919144670898763, "percentage": 94.6, "elapsed_time": "17:07:02", "remaining_time": "0:58:40", "throughput": 3352.19, "total_tokens": 206570288} +{"current_steps": 169880, "total_steps": 179580, "loss": 0.6665, "lr": 4.431538861809581e-07, "epoch": 18.91970152578238, "percentage": 94.6, "elapsed_time": "17:07:04", "remaining_time": "0:58:38", "throughput": 3352.19, "total_tokens": 206576432} +{"current_steps": 169885, "total_steps": 179580, "loss": 0.6194, "lr": 4.426985439762804e-07, "epoch": 18.920258380666, "percentage": 94.6, "elapsed_time": "17:07:06", "remaining_time": "0:58:36", "throughput": 3352.19, "total_tokens": 206582512} +{"current_steps": 169890, "total_steps": 179580, "loss": 0.8225, "lr": 4.4224343373498736e-07, "epoch": 18.920815235549615, "percentage": 94.6, "elapsed_time": "17:07:07", "remaining_time": "0:58:35", "throughput": 3352.2, "total_tokens": 206588624} +{"current_steps": 169895, "total_steps": 179580, "loss": 0.9295, "lr": 4.417885554613782e-07, "epoch": 18.921372090433234, "percentage": 94.61, "elapsed_time": "17:07:09", "remaining_time": "0:58:33", "throughput": 3352.2, "total_tokens": 206594992} +{"current_steps": 169900, "total_steps": 179580, "loss": 0.7421, "lr": 4.4133390915975236e-07, "epoch": 18.92192894531685, "percentage": 94.61, "elapsed_time": "17:07:11", "remaining_time": "0:58:31", "throughput": 3352.21, "total_tokens": 206601200} +{"current_steps": 169905, "total_steps": 179580, "loss": 1.0529, "lr": 4.4087949483440636e-07, "epoch": 18.92248580020047, "percentage": 94.61, "elapsed_time": "17:07:13", "remaining_time": "0:58:29", "throughput": 3352.21, "total_tokens": 206607344} +{"current_steps": 169910, "total_steps": 179580, "loss": 0.8337, "lr": 4.404253124896285e-07, "epoch": 18.923042655084085, "percentage": 94.62, "elapsed_time": "17:07:15", "remaining_time": "0:58:27", "throughput": 3352.21, "total_tokens": 206613776} +{"current_steps": 169915, "total_steps": 179580, "loss": 0.6555, "lr": 4.399713621297097e-07, "epoch": 18.9235995099677, "percentage": 94.62, "elapsed_time": "17:07:16", "remaining_time": "0:58:25", "throughput": 3352.22, "total_tokens": 206620048} +{"current_steps": 169920, "total_steps": 179580, "loss": 0.5594, "lr": 4.39517643758941e-07, "epoch": 18.92415636485132, "percentage": 94.62, "elapsed_time": "17:07:18", "remaining_time": "0:58:24", "throughput": 3352.22, "total_tokens": 206626320} +{"current_steps": 169925, "total_steps": 179580, "loss": 0.6392, "lr": 4.390641573816023e-07, "epoch": 18.924713219734937, "percentage": 94.62, "elapsed_time": "17:07:20", "remaining_time": "0:58:22", "throughput": 3352.22, "total_tokens": 206632400} +{"current_steps": 169930, "total_steps": 179580, "loss": 0.6669, "lr": 4.3861090300198473e-07, "epoch": 18.925270074618556, "percentage": 94.63, "elapsed_time": "17:07:22", "remaining_time": "0:58:20", "throughput": 3352.23, "total_tokens": 206638704} +{"current_steps": 169935, "total_steps": 179580, "loss": 0.8568, "lr": 4.3815788062435967e-07, "epoch": 18.925826929502172, "percentage": 94.63, "elapsed_time": "17:07:23", "remaining_time": "0:58:18", "throughput": 3352.23, "total_tokens": 206644336} +{"current_steps": 169940, "total_steps": 179580, "loss": 0.647, "lr": 4.377050902530155e-07, "epoch": 18.926383784385788, "percentage": 94.63, "elapsed_time": "17:07:25", "remaining_time": "0:58:16", "throughput": 3352.23, "total_tokens": 206650448} +{"current_steps": 169945, "total_steps": 179580, "loss": 0.6393, "lr": 4.372525318922266e-07, "epoch": 18.926940639269407, "percentage": 94.63, "elapsed_time": "17:07:27", "remaining_time": "0:58:15", "throughput": 3352.23, "total_tokens": 206656432} +{"current_steps": 169950, "total_steps": 179580, "loss": 0.8661, "lr": 4.3680020554626446e-07, "epoch": 18.927497494153023, "percentage": 94.64, "elapsed_time": "17:07:29", "remaining_time": "0:58:13", "throughput": 3352.23, "total_tokens": 206662512} +{"current_steps": 169955, "total_steps": 179580, "loss": 0.8078, "lr": 4.363481112194062e-07, "epoch": 18.928054349036643, "percentage": 94.64, "elapsed_time": "17:07:30", "remaining_time": "0:58:11", "throughput": 3352.24, "total_tokens": 206668848} +{"current_steps": 169960, "total_steps": 179580, "loss": 0.4899, "lr": 4.3589624891592073e-07, "epoch": 18.92861120392026, "percentage": 94.64, "elapsed_time": "17:07:32", "remaining_time": "0:58:09", "throughput": 3352.24, "total_tokens": 206674992} +{"current_steps": 169965, "total_steps": 179580, "loss": 0.7773, "lr": 4.3544461864007126e-07, "epoch": 18.929168058803874, "percentage": 94.65, "elapsed_time": "17:07:34", "remaining_time": "0:58:07", "throughput": 3352.25, "total_tokens": 206681264} +{"current_steps": 169970, "total_steps": 179580, "loss": 0.6712, "lr": 4.349932203961321e-07, "epoch": 18.929724913687494, "percentage": 94.65, "elapsed_time": "17:07:36", "remaining_time": "0:58:06", "throughput": 3352.25, "total_tokens": 206687536} +{"current_steps": 169975, "total_steps": 179580, "loss": 0.5638, "lr": 4.345420541883638e-07, "epoch": 18.93028176857111, "percentage": 94.65, "elapsed_time": "17:07:38", "remaining_time": "0:58:04", "throughput": 3352.26, "total_tokens": 206693808} +{"current_steps": 169980, "total_steps": 179580, "loss": 0.9423, "lr": 4.3409112002102683e-07, "epoch": 18.93083862345473, "percentage": 94.65, "elapsed_time": "17:07:39", "remaining_time": "0:58:02", "throughput": 3352.26, "total_tokens": 206699888} +{"current_steps": 169985, "total_steps": 179580, "loss": 0.6094, "lr": 4.3364041789837885e-07, "epoch": 18.931395478338345, "percentage": 94.66, "elapsed_time": "17:07:41", "remaining_time": "0:58:00", "throughput": 3352.26, "total_tokens": 206705680} +{"current_steps": 169990, "total_steps": 179580, "loss": 0.6465, "lr": 4.331899478246804e-07, "epoch": 18.93195233322196, "percentage": 94.66, "elapsed_time": "17:07:43", "remaining_time": "0:57:58", "throughput": 3352.27, "total_tokens": 206711920} +{"current_steps": 169995, "total_steps": 179580, "loss": 0.6679, "lr": 4.3273970980418356e-07, "epoch": 18.93250918810558, "percentage": 94.66, "elapsed_time": "17:07:44", "remaining_time": "0:57:56", "throughput": 3352.27, "total_tokens": 206717392} +{"current_steps": 170000, "total_steps": 179580, "loss": 0.9174, "lr": 4.3228970384114887e-07, "epoch": 18.933066042989196, "percentage": 94.67, "elapsed_time": "17:07:46", "remaining_time": "0:57:55", "throughput": 3352.27, "total_tokens": 206723504} +{"current_steps": 170005, "total_steps": 179580, "loss": 0.5607, "lr": 4.318399299398146e-07, "epoch": 18.933622897872816, "percentage": 94.67, "elapsed_time": "17:07:48", "remaining_time": "0:57:53", "throughput": 3352.27, "total_tokens": 206729584} +{"current_steps": 170010, "total_steps": 179580, "loss": 0.5642, "lr": 4.3139038810443845e-07, "epoch": 18.93417975275643, "percentage": 94.67, "elapsed_time": "17:07:50", "remaining_time": "0:57:51", "throughput": 3352.28, "total_tokens": 206735504} +{"current_steps": 170015, "total_steps": 179580, "loss": 0.7605, "lr": 4.3094107833926424e-07, "epoch": 18.934736607640048, "percentage": 94.67, "elapsed_time": "17:07:51", "remaining_time": "0:57:49", "throughput": 3352.28, "total_tokens": 206741680} +{"current_steps": 170020, "total_steps": 179580, "loss": 0.8918, "lr": 4.304920006485358e-07, "epoch": 18.935293462523667, "percentage": 94.68, "elapsed_time": "17:07:53", "remaining_time": "0:57:47", "throughput": 3352.28, "total_tokens": 206747888} +{"current_steps": 170025, "total_steps": 179580, "loss": 0.6317, "lr": 4.3004315503649697e-07, "epoch": 18.935850317407283, "percentage": 94.68, "elapsed_time": "17:07:55", "remaining_time": "0:57:46", "throughput": 3352.29, "total_tokens": 206754064} +{"current_steps": 170030, "total_steps": 179580, "loss": 0.7951, "lr": 4.29594541507386e-07, "epoch": 18.936407172290902, "percentage": 94.68, "elapsed_time": "17:07:57", "remaining_time": "0:57:44", "throughput": 3352.29, "total_tokens": 206760336} +{"current_steps": 170035, "total_steps": 179580, "loss": 0.8599, "lr": 4.291461600654356e-07, "epoch": 18.93696402717452, "percentage": 94.68, "elapsed_time": "17:07:59", "remaining_time": "0:57:42", "throughput": 3352.29, "total_tokens": 206766448} +{"current_steps": 170040, "total_steps": 179580, "loss": 0.3818, "lr": 4.2869801071488967e-07, "epoch": 18.937520882058134, "percentage": 94.69, "elapsed_time": "17:08:00", "remaining_time": "0:57:40", "throughput": 3352.3, "total_tokens": 206772784} +{"current_steps": 170045, "total_steps": 179580, "loss": 0.6997, "lr": 4.2825009345997537e-07, "epoch": 18.938077736941754, "percentage": 94.69, "elapsed_time": "17:08:02", "remaining_time": "0:57:38", "throughput": 3352.3, "total_tokens": 206778640} +{"current_steps": 170050, "total_steps": 179580, "loss": 0.7171, "lr": 4.2780240830492536e-07, "epoch": 18.93863459182537, "percentage": 94.69, "elapsed_time": "17:08:04", "remaining_time": "0:57:36", "throughput": 3352.31, "total_tokens": 206784656} +{"current_steps": 170055, "total_steps": 179580, "loss": 0.6208, "lr": 4.2735495525396965e-07, "epoch": 18.93919144670899, "percentage": 94.7, "elapsed_time": "17:08:06", "remaining_time": "0:57:35", "throughput": 3352.31, "total_tokens": 206790544} +{"current_steps": 170060, "total_steps": 179580, "loss": 0.8053, "lr": 4.2690773431133256e-07, "epoch": 18.939748301592605, "percentage": 94.7, "elapsed_time": "17:08:07", "remaining_time": "0:57:33", "throughput": 3352.31, "total_tokens": 206796016} +{"current_steps": 170065, "total_steps": 179580, "loss": 0.678, "lr": 4.264607454812386e-07, "epoch": 18.94030515647622, "percentage": 94.7, "elapsed_time": "17:08:09", "remaining_time": "0:57:31", "throughput": 3352.31, "total_tokens": 206802384} +{"current_steps": 170070, "total_steps": 179580, "loss": 0.5596, "lr": 4.260139887679121e-07, "epoch": 18.94086201135984, "percentage": 94.7, "elapsed_time": "17:08:11", "remaining_time": "0:57:29", "throughput": 3352.31, "total_tokens": 206808528} +{"current_steps": 170075, "total_steps": 179580, "loss": 0.7566, "lr": 4.255674641755747e-07, "epoch": 18.941418866243456, "percentage": 94.71, "elapsed_time": "17:08:13", "remaining_time": "0:57:27", "throughput": 3352.32, "total_tokens": 206814608} +{"current_steps": 170080, "total_steps": 179580, "loss": 0.6204, "lr": 4.2512117170843967e-07, "epoch": 18.941975721127076, "percentage": 94.71, "elapsed_time": "17:08:14", "remaining_time": "0:57:26", "throughput": 3352.32, "total_tokens": 206820592} +{"current_steps": 170085, "total_steps": 179580, "loss": 0.8967, "lr": 4.2467511137072034e-07, "epoch": 18.94253257601069, "percentage": 94.71, "elapsed_time": "17:08:16", "remaining_time": "0:57:24", "throughput": 3352.32, "total_tokens": 206826672} +{"current_steps": 170090, "total_steps": 179580, "loss": 0.7993, "lr": 4.2422928316663835e-07, "epoch": 18.943089430894307, "percentage": 94.72, "elapsed_time": "17:08:18", "remaining_time": "0:57:22", "throughput": 3352.33, "total_tokens": 206832752} +{"current_steps": 170095, "total_steps": 179580, "loss": 0.4425, "lr": 4.2378368710039864e-07, "epoch": 18.943646285777927, "percentage": 94.72, "elapsed_time": "17:08:20", "remaining_time": "0:57:20", "throughput": 3352.33, "total_tokens": 206838992} +{"current_steps": 170100, "total_steps": 179580, "loss": 1.0784, "lr": 4.233383231762145e-07, "epoch": 18.944203140661543, "percentage": 94.72, "elapsed_time": "17:08:21", "remaining_time": "0:57:18", "throughput": 3352.33, "total_tokens": 206845168} +{"current_steps": 170105, "total_steps": 179580, "loss": 0.6165, "lr": 4.228931913982853e-07, "epoch": 18.944759995545162, "percentage": 94.72, "elapsed_time": "17:08:23", "remaining_time": "0:57:16", "throughput": 3352.34, "total_tokens": 206851056} +{"current_steps": 170110, "total_steps": 179580, "loss": 0.7156, "lr": 4.2244829177082446e-07, "epoch": 18.945316850428778, "percentage": 94.73, "elapsed_time": "17:08:25", "remaining_time": "0:57:15", "throughput": 3352.34, "total_tokens": 206857264} +{"current_steps": 170115, "total_steps": 179580, "loss": 0.8676, "lr": 4.220036242980313e-07, "epoch": 18.945873705312394, "percentage": 94.73, "elapsed_time": "17:08:26", "remaining_time": "0:57:13", "throughput": 3352.34, "total_tokens": 206862576} +{"current_steps": 170120, "total_steps": 179580, "loss": 0.7379, "lr": 4.215591889841053e-07, "epoch": 18.946430560196013, "percentage": 94.73, "elapsed_time": "17:08:28", "remaining_time": "0:57:11", "throughput": 3352.34, "total_tokens": 206868880} +{"current_steps": 170125, "total_steps": 179580, "loss": 0.5812, "lr": 4.2111498583324306e-07, "epoch": 18.94698741507963, "percentage": 94.73, "elapsed_time": "17:08:30", "remaining_time": "0:57:09", "throughput": 3352.35, "total_tokens": 206874320} +{"current_steps": 170130, "total_steps": 179580, "loss": 0.7887, "lr": 4.2067101484964397e-07, "epoch": 18.94754426996325, "percentage": 94.74, "elapsed_time": "17:08:32", "remaining_time": "0:57:07", "throughput": 3352.35, "total_tokens": 206880304} +{"current_steps": 170135, "total_steps": 179580, "loss": 0.8311, "lr": 4.2022727603749647e-07, "epoch": 18.948101124846865, "percentage": 94.74, "elapsed_time": "17:08:33", "remaining_time": "0:57:06", "throughput": 3352.35, "total_tokens": 206886256} +{"current_steps": 170140, "total_steps": 179580, "loss": 0.895, "lr": 4.197837694009971e-07, "epoch": 18.94865797973048, "percentage": 94.74, "elapsed_time": "17:08:35", "remaining_time": "0:57:04", "throughput": 3352.35, "total_tokens": 206892560} +{"current_steps": 170145, "total_steps": 179580, "loss": 0.6052, "lr": 4.1934049494433415e-07, "epoch": 18.9492148346141, "percentage": 94.75, "elapsed_time": "17:08:37", "remaining_time": "0:57:02", "throughput": 3352.36, "total_tokens": 206898640} +{"current_steps": 170150, "total_steps": 179580, "loss": 0.6383, "lr": 4.18897452671696e-07, "epoch": 18.949771689497716, "percentage": 94.75, "elapsed_time": "17:08:39", "remaining_time": "0:57:00", "throughput": 3352.36, "total_tokens": 206904496} +{"current_steps": 170155, "total_steps": 179580, "loss": 0.4754, "lr": 4.1845464258725985e-07, "epoch": 18.950328544381335, "percentage": 94.75, "elapsed_time": "17:08:40", "remaining_time": "0:56:58", "throughput": 3352.36, "total_tokens": 206910960} +{"current_steps": 170160, "total_steps": 179580, "loss": 0.5409, "lr": 4.180120646952196e-07, "epoch": 18.95088539926495, "percentage": 94.75, "elapsed_time": "17:08:42", "remaining_time": "0:56:56", "throughput": 3352.37, "total_tokens": 206916784} +{"current_steps": 170165, "total_steps": 179580, "loss": 0.5968, "lr": 4.1756971899974683e-07, "epoch": 18.951442254148567, "percentage": 94.76, "elapsed_time": "17:08:44", "remaining_time": "0:56:55", "throughput": 3352.37, "total_tokens": 206922832} +{"current_steps": 170170, "total_steps": 179580, "loss": 0.5099, "lr": 4.171276055050244e-07, "epoch": 18.951999109032187, "percentage": 94.76, "elapsed_time": "17:08:46", "remaining_time": "0:56:53", "throughput": 3352.37, "total_tokens": 206928784} +{"current_steps": 170175, "total_steps": 179580, "loss": 0.6211, "lr": 4.166857242152267e-07, "epoch": 18.952555963915803, "percentage": 94.76, "elapsed_time": "17:08:47", "remaining_time": "0:56:51", "throughput": 3352.38, "total_tokens": 206935024} +{"current_steps": 170180, "total_steps": 179580, "loss": 0.7021, "lr": 4.1624407513452814e-07, "epoch": 18.953112818799422, "percentage": 94.77, "elapsed_time": "17:08:49", "remaining_time": "0:56:49", "throughput": 3352.38, "total_tokens": 206941296} +{"current_steps": 170185, "total_steps": 179580, "loss": 0.7377, "lr": 4.158026582670976e-07, "epoch": 18.953669673683038, "percentage": 94.77, "elapsed_time": "17:08:51", "remaining_time": "0:56:47", "throughput": 3352.38, "total_tokens": 206947056} +{"current_steps": 170190, "total_steps": 179580, "loss": 0.5804, "lr": 4.153614736171152e-07, "epoch": 18.954226528566657, "percentage": 94.77, "elapsed_time": "17:08:53", "remaining_time": "0:56:46", "throughput": 3352.38, "total_tokens": 206953072} +{"current_steps": 170195, "total_steps": 179580, "loss": 0.7471, "lr": 4.14920521188733e-07, "epoch": 18.954783383450273, "percentage": 94.77, "elapsed_time": "17:08:54", "remaining_time": "0:56:44", "throughput": 3352.38, "total_tokens": 206959280} +{"current_steps": 170200, "total_steps": 179580, "loss": 0.7177, "lr": 4.1447980098612836e-07, "epoch": 18.95534023833389, "percentage": 94.78, "elapsed_time": "17:08:56", "remaining_time": "0:56:42", "throughput": 3352.39, "total_tokens": 206965744} +{"current_steps": 170205, "total_steps": 179580, "loss": 0.7864, "lr": 4.1403931301345625e-07, "epoch": 18.95589709321751, "percentage": 94.78, "elapsed_time": "17:08:58", "remaining_time": "0:56:40", "throughput": 3352.39, "total_tokens": 206971888} +{"current_steps": 170210, "total_steps": 179580, "loss": 1.0406, "lr": 4.135990572748827e-07, "epoch": 18.956453948101124, "percentage": 94.78, "elapsed_time": "17:09:00", "remaining_time": "0:56:38", "throughput": 3352.39, "total_tokens": 206978064} +{"current_steps": 170215, "total_steps": 179580, "loss": 0.963, "lr": 4.1315903377456553e-07, "epoch": 18.95701080298474, "percentage": 94.79, "elapsed_time": "17:09:02", "remaining_time": "0:56:36", "throughput": 3352.4, "total_tokens": 206984208} +{"current_steps": 170220, "total_steps": 179580, "loss": 0.6314, "lr": 4.1271924251665707e-07, "epoch": 18.95756765786836, "percentage": 94.79, "elapsed_time": "17:09:03", "remaining_time": "0:56:35", "throughput": 3352.4, "total_tokens": 206990192} +{"current_steps": 170225, "total_steps": 179580, "loss": 0.8582, "lr": 4.1227968350531497e-07, "epoch": 18.958124512751976, "percentage": 94.79, "elapsed_time": "17:09:05", "remaining_time": "0:56:33", "throughput": 3352.41, "total_tokens": 206996624} +{"current_steps": 170230, "total_steps": 179580, "loss": 0.5736, "lr": 4.1184035674469155e-07, "epoch": 18.958681367635595, "percentage": 94.79, "elapsed_time": "17:09:07", "remaining_time": "0:56:31", "throughput": 3352.41, "total_tokens": 207002512} +{"current_steps": 170235, "total_steps": 179580, "loss": 0.9015, "lr": 4.1140126223893626e-07, "epoch": 18.95923822251921, "percentage": 94.8, "elapsed_time": "17:09:09", "remaining_time": "0:56:29", "throughput": 3352.41, "total_tokens": 207008976} +{"current_steps": 170240, "total_steps": 179580, "loss": 0.553, "lr": 4.1096239999219575e-07, "epoch": 18.95979507740283, "percentage": 94.8, "elapsed_time": "17:09:10", "remaining_time": "0:56:27", "throughput": 3352.42, "total_tokens": 207014672} +{"current_steps": 170245, "total_steps": 179580, "loss": 0.7701, "lr": 4.1052377000861397e-07, "epoch": 18.960351932286446, "percentage": 94.8, "elapsed_time": "17:09:12", "remaining_time": "0:56:26", "throughput": 3352.42, "total_tokens": 207020016} +{"current_steps": 170250, "total_steps": 179580, "loss": 0.8436, "lr": 4.100853722923376e-07, "epoch": 18.960908787170062, "percentage": 94.8, "elapsed_time": "17:09:14", "remaining_time": "0:56:24", "throughput": 3352.42, "total_tokens": 207026256} +{"current_steps": 170255, "total_steps": 179580, "loss": 0.683, "lr": 4.096472068475049e-07, "epoch": 18.961465642053682, "percentage": 94.81, "elapsed_time": "17:09:15", "remaining_time": "0:56:22", "throughput": 3352.42, "total_tokens": 207032208} +{"current_steps": 170260, "total_steps": 179580, "loss": 0.8018, "lr": 4.092092736782599e-07, "epoch": 18.962022496937298, "percentage": 94.81, "elapsed_time": "17:09:17", "remaining_time": "0:56:20", "throughput": 3352.43, "total_tokens": 207038192} +{"current_steps": 170265, "total_steps": 179580, "loss": 0.7214, "lr": 4.087715727887298e-07, "epoch": 18.962579351820917, "percentage": 94.81, "elapsed_time": "17:09:19", "remaining_time": "0:56:18", "throughput": 3352.43, "total_tokens": 207044208} +{"current_steps": 170270, "total_steps": 179580, "loss": 0.733, "lr": 4.0833410418305575e-07, "epoch": 18.963136206704533, "percentage": 94.82, "elapsed_time": "17:09:21", "remaining_time": "0:56:16", "throughput": 3352.43, "total_tokens": 207050512} +{"current_steps": 170275, "total_steps": 179580, "loss": 0.7566, "lr": 4.0789686786536773e-07, "epoch": 18.96369306158815, "percentage": 94.82, "elapsed_time": "17:09:23", "remaining_time": "0:56:15", "throughput": 3352.43, "total_tokens": 207056368} +{"current_steps": 170280, "total_steps": 179580, "loss": 0.6348, "lr": 4.074598638397986e-07, "epoch": 18.96424991647177, "percentage": 94.82, "elapsed_time": "17:09:24", "remaining_time": "0:56:13", "throughput": 3352.44, "total_tokens": 207062608} +{"current_steps": 170285, "total_steps": 179580, "loss": 0.6804, "lr": 4.0702309211047564e-07, "epoch": 18.964806771355384, "percentage": 94.82, "elapsed_time": "17:09:26", "remaining_time": "0:56:11", "throughput": 3352.44, "total_tokens": 207068944} +{"current_steps": 170290, "total_steps": 179580, "loss": 0.5772, "lr": 4.0658655268152046e-07, "epoch": 18.965363626239004, "percentage": 94.83, "elapsed_time": "17:09:28", "remaining_time": "0:56:09", "throughput": 3352.44, "total_tokens": 207075024} +{"current_steps": 170295, "total_steps": 179580, "loss": 0.8948, "lr": 4.061502455570604e-07, "epoch": 18.96592048112262, "percentage": 94.83, "elapsed_time": "17:09:30", "remaining_time": "0:56:07", "throughput": 3352.45, "total_tokens": 207080784} +{"current_steps": 170300, "total_steps": 179580, "loss": 0.6129, "lr": 4.057141707412143e-07, "epoch": 18.966477336006236, "percentage": 94.83, "elapsed_time": "17:09:31", "remaining_time": "0:56:06", "throughput": 3352.45, "total_tokens": 207087056} +{"current_steps": 170305, "total_steps": 179580, "loss": 0.6208, "lr": 4.05278328238104e-07, "epoch": 18.967034190889855, "percentage": 94.84, "elapsed_time": "17:09:33", "remaining_time": "0:56:04", "throughput": 3352.45, "total_tokens": 207093296} +{"current_steps": 170310, "total_steps": 179580, "loss": 0.846, "lr": 4.048427180518455e-07, "epoch": 18.96759104577347, "percentage": 94.84, "elapsed_time": "17:09:35", "remaining_time": "0:56:02", "throughput": 3352.45, "total_tokens": 207098800} +{"current_steps": 170315, "total_steps": 179580, "loss": 0.5925, "lr": 4.044073401865522e-07, "epoch": 18.96814790065709, "percentage": 94.84, "elapsed_time": "17:09:37", "remaining_time": "0:56:00", "throughput": 3352.46, "total_tokens": 207104880} +{"current_steps": 170320, "total_steps": 179580, "loss": 0.6625, "lr": 4.0397219464633484e-07, "epoch": 18.968704755540706, "percentage": 94.84, "elapsed_time": "17:09:38", "remaining_time": "0:55:58", "throughput": 3352.46, "total_tokens": 207111280} +{"current_steps": 170325, "total_steps": 179580, "loss": 0.7013, "lr": 4.0353728143530946e-07, "epoch": 18.969261610424322, "percentage": 94.85, "elapsed_time": "17:09:40", "remaining_time": "0:55:56", "throughput": 3352.46, "total_tokens": 207117168} +{"current_steps": 170330, "total_steps": 179580, "loss": 0.8786, "lr": 4.0310260055757554e-07, "epoch": 18.96981846530794, "percentage": 94.85, "elapsed_time": "17:09:42", "remaining_time": "0:55:55", "throughput": 3352.46, "total_tokens": 207123440} +{"current_steps": 170335, "total_steps": 179580, "loss": 0.6875, "lr": 4.0266815201725206e-07, "epoch": 18.970375320191557, "percentage": 94.85, "elapsed_time": "17:09:44", "remaining_time": "0:55:53", "throughput": 3352.47, "total_tokens": 207129776} +{"current_steps": 170340, "total_steps": 179580, "loss": 0.8261, "lr": 4.022339358184302e-07, "epoch": 18.970932175075177, "percentage": 94.85, "elapsed_time": "17:09:46", "remaining_time": "0:55:51", "throughput": 3352.47, "total_tokens": 207136208} +{"current_steps": 170345, "total_steps": 179580, "loss": 0.7364, "lr": 4.017999519652149e-07, "epoch": 18.971489029958793, "percentage": 94.86, "elapsed_time": "17:09:47", "remaining_time": "0:55:49", "throughput": 3352.48, "total_tokens": 207142288} +{"current_steps": 170350, "total_steps": 179580, "loss": 0.7361, "lr": 4.013662004617086e-07, "epoch": 18.97204588484241, "percentage": 94.86, "elapsed_time": "17:09:49", "remaining_time": "0:55:47", "throughput": 3352.48, "total_tokens": 207148272} +{"current_steps": 170355, "total_steps": 179580, "loss": 0.6249, "lr": 4.009326813120079e-07, "epoch": 18.972602739726028, "percentage": 94.86, "elapsed_time": "17:09:51", "remaining_time": "0:55:46", "throughput": 3352.48, "total_tokens": 207154544} +{"current_steps": 170360, "total_steps": 179580, "loss": 0.9752, "lr": 4.004993945202068e-07, "epoch": 18.973159594609644, "percentage": 94.87, "elapsed_time": "17:09:53", "remaining_time": "0:55:44", "throughput": 3352.49, "total_tokens": 207160592} +{"current_steps": 170365, "total_steps": 179580, "loss": 0.881, "lr": 4.0006634009039643e-07, "epoch": 18.973716449493264, "percentage": 94.87, "elapsed_time": "17:09:54", "remaining_time": "0:55:42", "throughput": 3352.49, "total_tokens": 207165968} +{"current_steps": 170370, "total_steps": 179580, "loss": 0.8005, "lr": 3.996335180266653e-07, "epoch": 18.97427330437688, "percentage": 94.87, "elapsed_time": "17:09:56", "remaining_time": "0:55:40", "throughput": 3352.49, "total_tokens": 207172048} +{"current_steps": 170375, "total_steps": 179580, "loss": 0.6446, "lr": 3.9920092833310995e-07, "epoch": 18.974830159260495, "percentage": 94.87, "elapsed_time": "17:09:58", "remaining_time": "0:55:38", "throughput": 3352.49, "total_tokens": 207178352} +{"current_steps": 170380, "total_steps": 179580, "loss": 0.7397, "lr": 3.987685710138106e-07, "epoch": 18.975387014144115, "percentage": 94.88, "elapsed_time": "17:10:00", "remaining_time": "0:55:37", "throughput": 3352.5, "total_tokens": 207184400} +{"current_steps": 170385, "total_steps": 179580, "loss": 0.7349, "lr": 3.983364460728528e-07, "epoch": 18.97594386902773, "percentage": 94.88, "elapsed_time": "17:10:01", "remaining_time": "0:55:35", "throughput": 3352.5, "total_tokens": 207190480} +{"current_steps": 170390, "total_steps": 179580, "loss": 0.4886, "lr": 3.979045535143139e-07, "epoch": 18.97650072391135, "percentage": 94.88, "elapsed_time": "17:10:03", "remaining_time": "0:55:33", "throughput": 3352.5, "total_tokens": 207196560} +{"current_steps": 170395, "total_steps": 179580, "loss": 1.0564, "lr": 3.9747289334227943e-07, "epoch": 18.977057578794966, "percentage": 94.89, "elapsed_time": "17:10:05", "remaining_time": "0:55:31", "throughput": 3352.51, "total_tokens": 207202800} +{"current_steps": 170400, "total_steps": 179580, "loss": 0.5261, "lr": 3.97041465560824e-07, "epoch": 18.977614433678582, "percentage": 94.89, "elapsed_time": "17:10:07", "remaining_time": "0:55:29", "throughput": 3352.51, "total_tokens": 207208976} +{"current_steps": 170405, "total_steps": 179580, "loss": 0.7084, "lr": 3.966102701740276e-07, "epoch": 18.9781712885622, "percentage": 94.89, "elapsed_time": "17:10:08", "remaining_time": "0:55:27", "throughput": 3352.51, "total_tokens": 207214608} +{"current_steps": 170410, "total_steps": 179580, "loss": 0.7793, "lr": 3.961793071859565e-07, "epoch": 18.978728143445817, "percentage": 94.89, "elapsed_time": "17:10:10", "remaining_time": "0:55:26", "throughput": 3352.51, "total_tokens": 207220080} +{"current_steps": 170415, "total_steps": 179580, "loss": 0.6058, "lr": 3.957485766006824e-07, "epoch": 18.979284998329437, "percentage": 94.9, "elapsed_time": "17:10:12", "remaining_time": "0:55:24", "throughput": 3352.52, "total_tokens": 207226320} +{"current_steps": 170420, "total_steps": 179580, "loss": 0.4934, "lr": 3.953180784222771e-07, "epoch": 18.979841853213053, "percentage": 94.9, "elapsed_time": "17:10:13", "remaining_time": "0:55:22", "throughput": 3352.52, "total_tokens": 207232272} +{"current_steps": 170425, "total_steps": 179580, "loss": 0.8722, "lr": 3.9488781265480667e-07, "epoch": 18.98039870809667, "percentage": 94.9, "elapsed_time": "17:10:15", "remaining_time": "0:55:20", "throughput": 3352.52, "total_tokens": 207238512} +{"current_steps": 170430, "total_steps": 179580, "loss": 0.9102, "lr": 3.9445777930233183e-07, "epoch": 18.980955562980288, "percentage": 94.9, "elapsed_time": "17:10:17", "remaining_time": "0:55:18", "throughput": 3352.52, "total_tokens": 207244400} +{"current_steps": 170435, "total_steps": 179580, "loss": 0.5813, "lr": 3.940279783689188e-07, "epoch": 18.981512417863904, "percentage": 94.91, "elapsed_time": "17:10:19", "remaining_time": "0:55:17", "throughput": 3352.53, "total_tokens": 207250512} +{"current_steps": 170440, "total_steps": 179580, "loss": 0.5943, "lr": 3.935984098586226e-07, "epoch": 18.982069272747523, "percentage": 94.91, "elapsed_time": "17:10:20", "remaining_time": "0:55:15", "throughput": 3352.53, "total_tokens": 207256176} +{"current_steps": 170445, "total_steps": 179580, "loss": 0.637, "lr": 3.931690737755067e-07, "epoch": 18.98262612763114, "percentage": 94.91, "elapsed_time": "17:10:22", "remaining_time": "0:55:13", "throughput": 3352.53, "total_tokens": 207262320} +{"current_steps": 170450, "total_steps": 179580, "loss": 0.5666, "lr": 3.927399701236234e-07, "epoch": 18.983182982514755, "percentage": 94.92, "elapsed_time": "17:10:24", "remaining_time": "0:55:11", "throughput": 3352.54, "total_tokens": 207268496} +{"current_steps": 170455, "total_steps": 179580, "loss": 0.6643, "lr": 3.9231109890702777e-07, "epoch": 18.983739837398375, "percentage": 94.92, "elapsed_time": "17:10:26", "remaining_time": "0:55:09", "throughput": 3352.54, "total_tokens": 207274704} +{"current_steps": 170460, "total_steps": 179580, "loss": 0.7801, "lr": 3.918824601297638e-07, "epoch": 18.98429669228199, "percentage": 94.92, "elapsed_time": "17:10:27", "remaining_time": "0:55:07", "throughput": 3352.54, "total_tokens": 207280528} +{"current_steps": 170465, "total_steps": 179580, "loss": 0.647, "lr": 3.914540537958894e-07, "epoch": 18.98485354716561, "percentage": 94.92, "elapsed_time": "17:10:29", "remaining_time": "0:55:06", "throughput": 3352.54, "total_tokens": 207286608} +{"current_steps": 170470, "total_steps": 179580, "loss": 0.8286, "lr": 3.9102587990944573e-07, "epoch": 18.985410402049226, "percentage": 94.93, "elapsed_time": "17:10:31", "remaining_time": "0:55:04", "throughput": 3352.55, "total_tokens": 207292592} +{"current_steps": 170475, "total_steps": 179580, "loss": 0.6117, "lr": 3.905979384744796e-07, "epoch": 18.98596725693284, "percentage": 94.93, "elapsed_time": "17:10:33", "remaining_time": "0:55:02", "throughput": 3352.55, "total_tokens": 207298864} +{"current_steps": 170480, "total_steps": 179580, "loss": 0.7466, "lr": 3.901702294950349e-07, "epoch": 18.98652411181646, "percentage": 94.93, "elapsed_time": "17:10:34", "remaining_time": "0:55:00", "throughput": 3352.55, "total_tokens": 207305104} +{"current_steps": 170485, "total_steps": 179580, "loss": 0.9573, "lr": 3.897427529751474e-07, "epoch": 18.987080966700077, "percentage": 94.94, "elapsed_time": "17:10:36", "remaining_time": "0:54:58", "throughput": 3352.56, "total_tokens": 207311088} +{"current_steps": 170490, "total_steps": 179580, "loss": 0.5852, "lr": 3.8931550891885547e-07, "epoch": 18.987637821583697, "percentage": 94.94, "elapsed_time": "17:10:38", "remaining_time": "0:54:57", "throughput": 3352.56, "total_tokens": 207317296} +{"current_steps": 170495, "total_steps": 179580, "loss": 1.0493, "lr": 3.8888849733020037e-07, "epoch": 18.988194676467312, "percentage": 94.94, "elapsed_time": "17:10:40", "remaining_time": "0:54:55", "throughput": 3352.56, "total_tokens": 207323536} +{"current_steps": 170500, "total_steps": 179580, "loss": 0.7832, "lr": 3.8846171821320943e-07, "epoch": 18.98875153135093, "percentage": 94.94, "elapsed_time": "17:10:41", "remaining_time": "0:54:53", "throughput": 3352.57, "total_tokens": 207329392} +{"current_steps": 170505, "total_steps": 179580, "loss": 0.7318, "lr": 3.880351715719155e-07, "epoch": 18.989308386234548, "percentage": 94.95, "elapsed_time": "17:10:43", "remaining_time": "0:54:51", "throughput": 3352.57, "total_tokens": 207335216} +{"current_steps": 170510, "total_steps": 179580, "loss": 0.811, "lr": 3.876088574103487e-07, "epoch": 18.989865241118164, "percentage": 94.95, "elapsed_time": "17:10:45", "remaining_time": "0:54:49", "throughput": 3352.57, "total_tokens": 207341072} +{"current_steps": 170515, "total_steps": 179580, "loss": 0.9575, "lr": 3.871827757325336e-07, "epoch": 18.990422096001783, "percentage": 94.95, "elapsed_time": "17:10:47", "remaining_time": "0:54:47", "throughput": 3352.57, "total_tokens": 207347344} +{"current_steps": 170520, "total_steps": 179580, "loss": 0.6176, "lr": 3.867569265424975e-07, "epoch": 18.9909789508854, "percentage": 94.95, "elapsed_time": "17:10:49", "remaining_time": "0:54:46", "throughput": 3352.58, "total_tokens": 207353872} +{"current_steps": 170525, "total_steps": 179580, "loss": 0.6659, "lr": 3.8633130984426503e-07, "epoch": 18.991535805769015, "percentage": 94.96, "elapsed_time": "17:10:50", "remaining_time": "0:54:44", "throughput": 3352.58, "total_tokens": 207359792} +{"current_steps": 170530, "total_steps": 179580, "loss": 0.6148, "lr": 3.8590592564184957e-07, "epoch": 18.992092660652634, "percentage": 94.96, "elapsed_time": "17:10:52", "remaining_time": "0:54:42", "throughput": 3352.58, "total_tokens": 207366032} +{"current_steps": 170535, "total_steps": 179580, "loss": 0.6364, "lr": 3.854807739392757e-07, "epoch": 18.99264951553625, "percentage": 94.96, "elapsed_time": "17:10:54", "remaining_time": "0:54:40", "throughput": 3352.58, "total_tokens": 207371952} +{"current_steps": 170540, "total_steps": 179580, "loss": 0.598, "lr": 3.8505585474055416e-07, "epoch": 18.99320637041987, "percentage": 94.97, "elapsed_time": "17:10:56", "remaining_time": "0:54:38", "throughput": 3352.59, "total_tokens": 207378096} +{"current_steps": 170545, "total_steps": 179580, "loss": 0.6049, "lr": 3.846311680497039e-07, "epoch": 18.993763225303486, "percentage": 94.97, "elapsed_time": "17:10:58", "remaining_time": "0:54:37", "throughput": 3352.59, "total_tokens": 207384624} +{"current_steps": 170550, "total_steps": 179580, "loss": 0.639, "lr": 3.8420671387073283e-07, "epoch": 18.9943200801871, "percentage": 94.97, "elapsed_time": "17:10:59", "remaining_time": "0:54:35", "throughput": 3352.59, "total_tokens": 207390192} +{"current_steps": 170555, "total_steps": 179580, "loss": 0.6893, "lr": 3.837824922076516e-07, "epoch": 18.99487693507072, "percentage": 94.97, "elapsed_time": "17:11:01", "remaining_time": "0:54:33", "throughput": 3352.6, "total_tokens": 207396400} +{"current_steps": 170560, "total_steps": 179580, "loss": 0.8023, "lr": 3.8335850306446544e-07, "epoch": 18.995433789954337, "percentage": 94.98, "elapsed_time": "17:11:02", "remaining_time": "0:54:31", "throughput": 3352.6, "total_tokens": 207401712} +{"current_steps": 170565, "total_steps": 179580, "loss": 0.6682, "lr": 3.829347464451821e-07, "epoch": 18.995990644837956, "percentage": 94.98, "elapsed_time": "17:11:04", "remaining_time": "0:54:29", "throughput": 3352.6, "total_tokens": 207407888} +{"current_steps": 170570, "total_steps": 179580, "loss": 0.7824, "lr": 3.825112223538041e-07, "epoch": 18.996547499721572, "percentage": 94.98, "elapsed_time": "17:11:06", "remaining_time": "0:54:27", "throughput": 3352.6, "total_tokens": 207414256} +{"current_steps": 170575, "total_steps": 179580, "loss": 0.4925, "lr": 3.8208793079432813e-07, "epoch": 18.99710435460519, "percentage": 94.99, "elapsed_time": "17:11:08", "remaining_time": "0:54:26", "throughput": 3352.61, "total_tokens": 207420816} +{"current_steps": 170580, "total_steps": 179580, "loss": 0.7681, "lr": 3.816648717707566e-07, "epoch": 18.997661209488808, "percentage": 94.99, "elapsed_time": "17:11:10", "remaining_time": "0:54:24", "throughput": 3352.61, "total_tokens": 207426704} +{"current_steps": 170585, "total_steps": 179580, "loss": 0.9746, "lr": 3.812420452870835e-07, "epoch": 18.998218064372423, "percentage": 94.99, "elapsed_time": "17:11:11", "remaining_time": "0:54:22", "throughput": 3352.61, "total_tokens": 207432720} +{"current_steps": 170590, "total_steps": 179580, "loss": 0.5615, "lr": 3.808194513473029e-07, "epoch": 18.998774919256043, "percentage": 94.99, "elapsed_time": "17:11:13", "remaining_time": "0:54:20", "throughput": 3352.61, "total_tokens": 207438480} +{"current_steps": 170595, "total_steps": 179580, "loss": 0.6125, "lr": 3.803970899554116e-07, "epoch": 18.99933177413966, "percentage": 95.0, "elapsed_time": "17:11:15", "remaining_time": "0:54:18", "throughput": 3352.62, "total_tokens": 207444784} +{"current_steps": 170600, "total_steps": 179580, "loss": 0.8867, "lr": 3.7997496111538963e-07, "epoch": 18.99988862902328, "percentage": 95.0, "elapsed_time": "17:11:17", "remaining_time": "0:54:17", "throughput": 3352.62, "total_tokens": 207450832} +{"current_steps": 170601, "total_steps": 179580, "eval_loss": 0.7087222337722778, "epoch": 19.0, "percentage": 95.0, "elapsed_time": "17:13:07", "remaining_time": "0:54:22", "throughput": 3346.67, "total_tokens": 207451408} +{"current_steps": 170605, "total_steps": 179580, "loss": 0.6404, "lr": 3.795530648312312e-07, "epoch": 19.000445483906894, "percentage": 95.0, "elapsed_time": "17:13:11", "remaining_time": "0:54:21", "throughput": 3346.55, "total_tokens": 207456304}