{ "training_metrics": [ { "step": 1, "loss": 1.3050787448883057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:22:59.835715" }, { "step": 2, "loss": 1.2078838348388672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.018219" }, { "step": 3, "loss": 1.2663317918777466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.119079" }, { "step": 4, "loss": 1.2029879093170166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.217186" }, { "step": 5, "loss": 1.3343734741210938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.337416" }, { "step": 6, "loss": 1.351973056793213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.445705" }, { "step": 7, "loss": 1.3815804719924927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.587041" }, { "step": 8, "loss": 1.465112328529358, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.672614" }, { "step": 9, "loss": 1.212660551071167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.798439" }, { "step": 10, "loss": 1.1660399436950684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.894410" }, { "step": 11, "loss": 1.1456059217453003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:00.991947" }, { "step": 12, "loss": 1.1186232566833496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.111968" }, { "step": 13, "loss": 1.0071966648101807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.206558" }, { "step": 14, "loss": 0.9148580431938171, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.294533" }, { "step": 15, "loss": 1.1758041381835938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.396025" }, { "step": 16, "loss": 1.3618204593658447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.493405" }, { "step": 17, "loss": 1.2846041917800903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.579428" }, { "step": 18, "loss": 1.147242546081543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.669254" }, { "step": 19, "loss": 1.314335823059082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.755819" }, { "step": 20, "loss": 1.2243733406066895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.848879" }, { "step": 21, "loss": 0.8789243102073669, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:01.944661" }, { "step": 22, "loss": 1.0330204963684082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.031969" }, { "step": 23, "loss": 1.061643362045288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.121545" }, { "step": 24, "loss": 1.1151434183120728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.211588" }, { "step": 25, "loss": 1.4219403266906738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.300675" }, { "step": 26, "loss": 1.4582915306091309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.412264" }, { "step": 27, "loss": 1.095450520515442, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.509013" }, { "step": 28, "loss": 1.2971017360687256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.595952" }, { "step": 29, "loss": 1.4105441570281982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.688732" }, { "step": 30, "loss": 1.3414926528930664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.786310" }, { "step": 31, "loss": 1.122077226638794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.882973" }, { "step": 32, "loss": 0.9439704418182373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:02.968359" }, { "step": 33, "loss": 1.3068277835845947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.072462" }, { "step": 34, "loss": 1.1839179992675781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.199077" }, { "step": 35, "loss": 1.0622997283935547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.301756" }, { "step": 36, "loss": 1.2247941493988037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.416533" }, { "step": 37, "loss": 1.4072916507720947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.501377" }, { "step": 38, "loss": 0.8750972747802734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.594577" }, { "step": 39, "loss": 1.3152259588241577, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.694666" }, { "step": 40, "loss": 1.1265937089920044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.786760" }, { "step": 41, "loss": 1.3755652904510498, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.899069" }, { "step": 42, "loss": 0.806376576423645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:03.991228" }, { "step": 43, "loss": 0.8962408304214478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.090463" }, { "step": 44, "loss": 1.2257169485092163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.182243" }, { "step": 45, "loss": 1.0779008865356445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.269260" }, { "step": 46, "loss": 1.0365169048309326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.355088" }, { "step": 47, "loss": 1.0779401063919067, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.442993" }, { "step": 48, "loss": 1.2521958351135254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.527714" }, { "step": 49, "loss": 0.9483886957168579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.614934" }, { "step": 50, "loss": 1.0503500699996948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.707555" }, { "step": 51, "loss": 1.151254415512085, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.802844" }, { "step": 52, "loss": 0.9870988130569458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.899116" }, { "step": 53, "loss": 1.253812313079834, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:04.984812" }, { "step": 54, "loss": 1.2173309326171875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.099658" }, { "step": 55, "loss": 1.0257377624511719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.196644" }, { "step": 56, "loss": 1.079179048538208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.283126" }, { "step": 57, "loss": 0.9472022652626038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.378780" }, { "step": 58, "loss": 1.2585573196411133, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.496079" }, { "step": 59, "loss": 0.9418714642524719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.599891" }, { "step": 60, "loss": 1.0978301763534546, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.702908" }, { "step": 61, "loss": 1.0227195024490356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.809691" }, { "step": 62, "loss": 0.9669970273971558, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:05.905427" }, { "step": 63, "loss": 1.1433448791503906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.019082" }, { "step": 64, "loss": 1.081123948097229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.113143" }, { "step": 65, "loss": 0.9723439812660217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.209939" }, { "step": 66, "loss": 1.353165626525879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.303047" }, { "step": 67, "loss": 0.7512457966804504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.392198" }, { "step": 68, "loss": 1.2829312086105347, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.496323" }, { "step": 69, "loss": 0.8811122179031372, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.591561" }, { "step": 70, "loss": 1.3955371379852295, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.680616" }, { "step": 71, "loss": 1.219986915588379, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.776709" }, { "step": 72, "loss": 1.0334668159484863, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.867712" }, { "step": 73, "loss": 0.8768661022186279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:06.966694" }, { "step": 74, "loss": 1.1211309432983398, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.071199" }, { "step": 75, "loss": 1.1337069272994995, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.159441" }, { "step": 76, "loss": 1.2960258722305298, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.276409" }, { "step": 77, "loss": 1.339566707611084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.370052" }, { "step": 78, "loss": 0.7259435057640076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.454837" }, { "step": 79, "loss": 1.049821138381958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.568019" }, { "step": 80, "loss": 0.9487711191177368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.688307" }, { "step": 81, "loss": 0.9600706100463867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.778218" }, { "step": 82, "loss": 0.9650387763977051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.876065" }, { "step": 83, "loss": 1.1003963947296143, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:07.989120" }, { "step": 84, "loss": 1.1521543264389038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.082159" }, { "step": 85, "loss": 1.3651201725006104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.178845" }, { "step": 86, "loss": 1.0866142511367798, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.279182" }, { "step": 87, "loss": 1.4308860301971436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.391704" }, { "step": 88, "loss": 1.1554970741271973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.483410" }, { "step": 89, "loss": 1.126172423362732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.580806" }, { "step": 90, "loss": 1.248173713684082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.674243" }, { "step": 91, "loss": 0.9669547080993652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.767732" }, { "step": 92, "loss": 1.1082210540771484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.865835" }, { "step": 93, "loss": 1.0574169158935547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:08.960571" }, { "step": 94, "loss": 1.1422803401947021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.058269" }, { "step": 95, "loss": 1.3047819137573242, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.160029" }, { "step": 96, "loss": 0.899178147315979, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.246920" }, { "step": 97, "loss": 0.9732410907745361, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.332263" }, { "step": 98, "loss": 1.3599483966827393, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.417840" }, { "step": 99, "loss": 1.3512098789215088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.509151" }, { "step": 100, "loss": 0.9568990468978882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.605910" }, { "step": 101, "loss": 0.66900634765625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.702183" }, { "step": 102, "loss": 0.8713931441307068, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.795150" }, { "step": 103, "loss": 1.267458200454712, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.883448" }, { "step": 104, "loss": 1.0205079317092896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:09.980602" }, { "step": 105, "loss": 1.058205485343933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.075530" }, { "step": 106, "loss": 0.9220996499061584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.169418" }, { "step": 107, "loss": 1.1730895042419434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.259033" }, { "step": 108, "loss": 1.2663350105285645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.396794" }, { "step": 109, "loss": 1.1911993026733398, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.482637" }, { "step": 110, "loss": 0.7733999490737915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.569814" }, { "step": 111, "loss": 0.7724016904830933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.655195" }, { "step": 112, "loss": 0.954352855682373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.741902" }, { "step": 113, "loss": 0.9023012518882751, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.835146" }, { "step": 114, "loss": 1.0058404207229614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:10.927014" }, { "step": 115, "loss": 1.2724404335021973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.046277" }, { "step": 116, "loss": 1.2620184421539307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.137664" }, { "step": 117, "loss": 1.1601855754852295, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.231573" }, { "step": 118, "loss": 1.2270293235778809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.349078" }, { "step": 119, "loss": 1.1925755739212036, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.434730" }, { "step": 120, "loss": 1.0487998723983765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.528645" }, { "step": 121, "loss": 0.9262097477912903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.612890" }, { "step": 122, "loss": 1.0274128913879395, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.711824" }, { "step": 123, "loss": 1.2391242980957031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.808439" }, { "step": 124, "loss": 1.3189575672149658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.899100" }, { "step": 125, "loss": 0.6779279112815857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:11.988453" }, { "step": 126, "loss": 0.7960004210472107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.077469" }, { "step": 127, "loss": 0.9792642593383789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.170093" }, { "step": 128, "loss": 1.0294883251190186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.264083" }, { "step": 129, "loss": 0.9874156713485718, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.359263" }, { "step": 130, "loss": 0.8694393038749695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.455659" }, { "step": 131, "loss": 0.9963703155517578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.573277" }, { "step": 132, "loss": 1.1515052318572998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.666350" }, { "step": 133, "loss": 1.2097642421722412, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.753376" }, { "step": 134, "loss": 0.9924863576889038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.844632" }, { "step": 135, "loss": 0.7506842613220215, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:12.937523" }, { "step": 136, "loss": 1.1660935878753662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.025442" }, { "step": 137, "loss": 1.1429057121276855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.120952" }, { "step": 138, "loss": 1.2277697324752808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.213666" }, { "step": 139, "loss": 1.1666080951690674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.308820" }, { "step": 140, "loss": 1.181539535522461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.404126" }, { "step": 141, "loss": 1.0800518989562988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.507770" }, { "step": 142, "loss": 1.036144733428955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.599370" }, { "step": 143, "loss": 1.0066726207733154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.701227" }, { "step": 144, "loss": 1.0505298376083374, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.791598" }, { "step": 145, "loss": 1.2662677764892578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:13.886696" }, { "step": 146, "loss": 1.0714925527572632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.005172" }, { "step": 147, "loss": 0.9078054428100586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.097908" }, { "step": 148, "loss": 1.0191991329193115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.186308" }, { "step": 149, "loss": 1.372049331665039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.298888" }, { "step": 150, "loss": 1.0299190282821655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.400387" }, { "step": 151, "loss": 1.0138319730758667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.492969" }, { "step": 152, "loss": 1.0565838813781738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.592899" }, { "step": 153, "loss": 1.205650806427002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.745038" }, { "step": 154, "loss": 0.9937402606010437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.840837" }, { "step": 155, "loss": 1.373204231262207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:14.950119" }, { "step": 156, "loss": 0.9920722246170044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.047112" }, { "step": 157, "loss": 1.038219690322876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.139987" }, { "step": 158, "loss": 1.1375885009765625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.225908" }, { "step": 159, "loss": 1.172175645828247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.339626" }, { "step": 160, "loss": 0.8184976577758789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.432064" }, { "step": 161, "loss": 1.116856336593628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.519006" }, { "step": 162, "loss": 0.955221951007843, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.632002" }, { "step": 163, "loss": 0.8483065366744995, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.726024" }, { "step": 164, "loss": 0.9230486154556274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.818426" }, { "step": 165, "loss": 1.0032669305801392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:15.910659" }, { "step": 166, "loss": 0.9361698627471924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.012074" }, { "step": 167, "loss": 0.7937893867492676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.112156" }, { "step": 168, "loss": 1.2238152027130127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.209823" }, { "step": 169, "loss": 1.2015044689178467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.295058" }, { "step": 170, "loss": 1.0227413177490234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.389388" }, { "step": 171, "loss": 1.0320185422897339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.481488" }, { "step": 172, "loss": 0.9202956557273865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.567972" }, { "step": 173, "loss": 1.2657225131988525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.684073" }, { "step": 174, "loss": 1.0242061614990234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.771117" }, { "step": 175, "loss": 0.9348657131195068, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.861271" }, { "step": 176, "loss": 0.9941954612731934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:16.956907" }, { "step": 177, "loss": 0.8053163290023804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.041857" }, { "step": 178, "loss": 1.049076795578003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.161127" }, { "step": 179, "loss": 1.136406421661377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.285090" }, { "step": 180, "loss": 0.6510275602340698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.373519" }, { "step": 181, "loss": 0.9205646514892578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.460063" }, { "step": 182, "loss": 0.7404705286026001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.544498" }, { "step": 183, "loss": 1.047424554824829, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.647504" }, { "step": 184, "loss": 1.1065635681152344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.733661" }, { "step": 185, "loss": 1.0873833894729614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.819041" }, { "step": 186, "loss": 0.9531699419021606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:17.906818" }, { "step": 187, "loss": 1.0485737323760986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.002763" }, { "step": 188, "loss": 1.014886736869812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.095907" }, { "step": 189, "loss": 1.2178032398223877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.211184" }, { "step": 190, "loss": 0.7610359191894531, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.303564" }, { "step": 191, "loss": 1.0535545349121094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.399480" }, { "step": 192, "loss": 0.9141170978546143, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.486800" }, { "step": 193, "loss": 0.865950345993042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.578568" }, { "step": 194, "loss": 1.0239763259887695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.673981" }, { "step": 195, "loss": 1.0136351585388184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.759061" }, { "step": 196, "loss": 0.8811721801757812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.854564" }, { "step": 197, "loss": 0.8067998290061951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:18.943531" }, { "step": 198, "loss": 0.9961643218994141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.029866" }, { "step": 199, "loss": 0.9516854286193848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.122559" }, { "step": 200, "loss": 1.057553768157959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.213704" }, { "step": 201, "loss": 1.0080459117889404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.303315" }, { "step": 202, "loss": 1.144012689590454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.392146" }, { "step": 203, "loss": 1.1004252433776855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.534872" }, { "step": 204, "loss": 0.9167330265045166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.626995" }, { "step": 205, "loss": 1.16129469871521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.711335" }, { "step": 206, "loss": 0.771239161491394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.804958" }, { "step": 207, "loss": 1.3989214897155762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:19.917982" }, { "step": 208, "loss": 0.8565049767494202, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.002923" }, { "step": 209, "loss": 0.7429771423339844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.095112" }, { "step": 210, "loss": 1.024583101272583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.185146" }, { "step": 211, "loss": 0.7049229145050049, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.274857" }, { "step": 212, "loss": 0.6496537923812866, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.366465" }, { "step": 213, "loss": 1.1211764812469482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.490794" }, { "step": 214, "loss": 0.9313467741012573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.581240" }, { "step": 215, "loss": 0.9920042753219604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.677127" }, { "step": 216, "loss": 1.0744054317474365, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.767188" }, { "step": 217, "loss": 1.0307865142822266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.885440" }, { "step": 218, "loss": 0.9189707040786743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:20.983898" }, { "step": 219, "loss": 0.8124669790267944, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.070710" }, { "step": 220, "loss": 0.9004138112068176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.156612" }, { "step": 221, "loss": 1.1746535301208496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.244022" }, { "step": 222, "loss": 0.8075965642929077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.337084" }, { "step": 223, "loss": 0.8815158605575562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.431209" }, { "step": 224, "loss": 0.8423941135406494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.518213" }, { "step": 225, "loss": 0.8229867815971375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.619513" }, { "step": 226, "loss": 1.081260323524475, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.709114" }, { "step": 227, "loss": 1.1420092582702637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.809104" }, { "step": 228, "loss": 0.7469054460525513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:21.894274" }, { "step": 229, "loss": 0.9589672088623047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.008453" }, { "step": 230, "loss": 1.006912350654602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.092665" }, { "step": 231, "loss": 1.1954916715621948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.212247" }, { "step": 232, "loss": 1.1728932857513428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.304771" }, { "step": 233, "loss": 1.0483267307281494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.392598" }, { "step": 234, "loss": 1.0153841972351074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.485744" }, { "step": 235, "loss": 1.2020751237869263, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.575091" }, { "step": 236, "loss": 0.6838197708129883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.661141" }, { "step": 237, "loss": 0.8458431959152222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.757796" }, { "step": 238, "loss": 1.0748976469039917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.858914" }, { "step": 239, "loss": 0.9099082350730896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:22.944509" }, { "step": 240, "loss": 1.0588456392288208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.035075" }, { "step": 241, "loss": 1.0514596700668335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.127867" }, { "step": 242, "loss": 1.106227159500122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.225543" }, { "step": 243, "loss": 0.6501455903053284, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.313885" }, { "step": 244, "loss": 1.0700569152832031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.435802" }, { "step": 245, "loss": 0.8423296213150024, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.528716" }, { "step": 246, "loss": 0.8979228734970093, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.617557" }, { "step": 247, "loss": 0.8162924647331238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.705715" }, { "step": 248, "loss": 0.9356038570404053, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.798103" }, { "step": 249, "loss": 0.8190819025039673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.883335" }, { "step": 250, "loss": 1.0329935550689697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:23.973769" }, { "step": 251, "loss": 1.2711927890777588, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.059608" }, { "step": 252, "loss": 0.7415053844451904, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.145660" }, { "step": 253, "loss": 1.1272684335708618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.236102" }, { "step": 254, "loss": 0.8926275968551636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.349639" }, { "step": 255, "loss": 0.6990458965301514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.443176" }, { "step": 256, "loss": 1.0282355546951294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.532861" }, { "step": 257, "loss": 1.32956063747406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.682567" }, { "step": 258, "loss": 0.9525560140609741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.774084" }, { "step": 259, "loss": 1.1152904033660889, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:24.884486" }, { "step": 260, "loss": 1.1152586936950684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.005783" }, { "step": 261, "loss": 1.1430402994155884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.094049" }, { "step": 262, "loss": 0.9953980445861816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.191126" }, { "step": 263, "loss": 0.7908657789230347, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.278757" }, { "step": 264, "loss": 0.9746399521827698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.397469" }, { "step": 265, "loss": 1.1198363304138184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.489862" }, { "step": 266, "loss": 1.3370811939239502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.585185" }, { "step": 267, "loss": 1.0487600564956665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.678736" }, { "step": 268, "loss": 0.9171916246414185, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.767336" }, { "step": 269, "loss": 0.9516528844833374, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.867352" }, { "step": 270, "loss": 0.8783036470413208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:25.959265" }, { "step": 271, "loss": 0.8060846328735352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.045269" }, { "step": 272, "loss": 0.8466569185256958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.134680" }, { "step": 273, "loss": 1.0817171335220337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.264684" }, { "step": 274, "loss": 0.9113312363624573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.364728" }, { "step": 275, "loss": 0.9165505170822144, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.456723" }, { "step": 276, "loss": 1.020063877105713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.581356" }, { "step": 277, "loss": 1.016211986541748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.671792" }, { "step": 278, "loss": 0.8753834366798401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.769148" }, { "step": 279, "loss": 1.0813932418823242, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.860848" }, { "step": 280, "loss": 1.0208675861358643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:26.948711" }, { "step": 281, "loss": 1.0998353958129883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.064747" }, { "step": 282, "loss": 0.9793296456336975, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.157581" }, { "step": 283, "loss": 1.0552709102630615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.254475" }, { "step": 284, "loss": 1.137678623199463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.365727" }, { "step": 285, "loss": 0.9670683145523071, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.457011" }, { "step": 286, "loss": 0.9862388968467712, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.560478" }, { "step": 287, "loss": 0.8304272890090942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.645385" }, { "step": 288, "loss": 0.9268807172775269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.734068" }, { "step": 289, "loss": 0.7760207653045654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.820643" }, { "step": 290, "loss": 1.225726842880249, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:27.936351" }, { "step": 291, "loss": 1.0068875551223755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.057963" }, { "step": 292, "loss": 1.1235895156860352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.174087" }, { "step": 293, "loss": 1.0673545598983765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.301954" }, { "step": 294, "loss": 0.9814757108688354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.395915" }, { "step": 295, "loss": 1.034455418586731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.514218" }, { "step": 296, "loss": 0.8248984217643738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.605730" }, { "step": 297, "loss": 1.1779937744140625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.698829" }, { "step": 298, "loss": 0.9323928356170654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.789682" }, { "step": 299, "loss": 0.8421998023986816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.879626" }, { "step": 300, "loss": 0.8538090586662292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:28.974906" }, { "step": 301, "loss": 0.9259281158447266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.056379" }, { "step": 302, "loss": 0.8828160762786865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.140669" }, { "step": 303, "loss": 0.87471604347229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.232371" }, { "step": 304, "loss": 1.1027024984359741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.326709" }, { "step": 305, "loss": 1.0356413125991821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.449162" }, { "step": 306, "loss": 1.1665071249008179, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.536648" }, { "step": 307, "loss": 1.0879212617874146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.651496" }, { "step": 308, "loss": 0.8005954027175903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.735775" }, { "step": 309, "loss": 0.8192386627197266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.828673" }, { "step": 310, "loss": 0.6475479006767273, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:29.913227" }, { "step": 311, "loss": 1.2005733251571655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.000383" }, { "step": 312, "loss": 0.8259143829345703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.088764" }, { "step": 313, "loss": 0.84437096118927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.176479" }, { "step": 314, "loss": 0.6710930466651917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.267322" }, { "step": 315, "loss": 1.0215888023376465, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.357362" }, { "step": 316, "loss": 1.0539754629135132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.450005" }, { "step": 317, "loss": 0.7388505935668945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.536968" }, { "step": 318, "loss": 0.7909910082817078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.622389" }, { "step": 319, "loss": 1.3333938121795654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.710105" }, { "step": 320, "loss": 0.9219117164611816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.819240" }, { "step": 321, "loss": 0.9464453458786011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.908145" }, { "step": 322, "loss": 1.1504666805267334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:30.993537" }, { "step": 323, "loss": 1.0680902004241943, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.107800" }, { "step": 324, "loss": 0.8451797962188721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.220552" }, { "step": 325, "loss": 1.3121073246002197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.353544" }, { "step": 326, "loss": 1.0015805959701538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.441210" }, { "step": 327, "loss": 0.8915814161300659, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.540867" }, { "step": 328, "loss": 0.917847216129303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.630412" }, { "step": 329, "loss": 1.1189594268798828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.717706" }, { "step": 330, "loss": 1.1791408061981201, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.835344" }, { "step": 331, "loss": 0.8247785568237305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:31.935292" }, { "step": 332, "loss": 0.6690821647644043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.025886" }, { "step": 333, "loss": 0.9799471497535706, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.139549" }, { "step": 334, "loss": 0.9471340179443359, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.229547" }, { "step": 335, "loss": 0.7814834117889404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.330028" }, { "step": 336, "loss": 0.8724034428596497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.444283" }, { "step": 337, "loss": 1.0430718660354614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.533650" }, { "step": 338, "loss": 0.8882424831390381, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.619189" }, { "step": 339, "loss": 1.0604846477508545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.704361" }, { "step": 340, "loss": 1.104205846786499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.789295" }, { "step": 341, "loss": 1.2247434854507446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.896333" }, { "step": 342, "loss": 0.726254940032959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:32.990321" }, { "step": 343, "loss": 1.052728533744812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.088953" }, { "step": 344, "loss": 0.6391576528549194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.188969" }, { "step": 345, "loss": 0.8079032897949219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.273973" }, { "step": 346, "loss": 0.827389121055603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.371539" }, { "step": 347, "loss": 1.1713037490844727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.486344" }, { "step": 348, "loss": 0.7702492475509644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.572311" }, { "step": 349, "loss": 0.7986340522766113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.668100" }, { "step": 350, "loss": 1.0324089527130127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.779910" }, { "step": 351, "loss": 1.0330963134765625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.905313" }, { "step": 352, "loss": 0.9828975200653076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:33.999825" }, { "step": 353, "loss": 0.6410664916038513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.087593" }, { "step": 354, "loss": 0.6034155488014221, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.175026" }, { "step": 355, "loss": 0.8771579265594482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.272601" }, { "step": 356, "loss": 1.3789119720458984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.388499" }, { "step": 357, "loss": 1.0358480215072632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.508009" }, { "step": 358, "loss": 1.249760389328003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.603367" }, { "step": 359, "loss": 0.8794363737106323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.690135" }, { "step": 360, "loss": 1.0043132305145264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.777704" }, { "step": 361, "loss": 0.8683585524559021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.873389" }, { "step": 362, "loss": 0.716355562210083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:34.968493" }, { "step": 363, "loss": 1.143733263015747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.078063" }, { "step": 364, "loss": 1.169050931930542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.171788" }, { "step": 365, "loss": 1.0854949951171875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.283816" }, { "step": 366, "loss": 1.0847289562225342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.411654" }, { "step": 367, "loss": 0.8840438723564148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.505814" }, { "step": 368, "loss": 0.8062880039215088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.603519" }, { "step": 369, "loss": 0.9567775130271912, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.687911" }, { "step": 370, "loss": 0.9526263475418091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.773676" }, { "step": 371, "loss": 1.1530170440673828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:35.910477" }, { "step": 372, "loss": 0.9376751780509949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.006715" }, { "step": 373, "loss": 1.0597378015518188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.105701" }, { "step": 374, "loss": 0.8837941884994507, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.221527" }, { "step": 375, "loss": 0.951033890247345, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.312907" }, { "step": 376, "loss": 1.0856374502182007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.435995" }, { "step": 377, "loss": 0.7438244223594666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.535546" }, { "step": 378, "loss": 0.9435797333717346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.628895" }, { "step": 379, "loss": 0.7998467683792114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.713857" }, { "step": 380, "loss": 0.9239392280578613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.800535" }, { "step": 381, "loss": 0.9461100101470947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.885533" }, { "step": 382, "loss": 1.0730273723602295, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:36.977350" }, { "step": 383, "loss": 1.1297657489776611, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.064039" }, { "step": 384, "loss": 0.7439780235290527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.182695" }, { "step": 385, "loss": 1.1253591775894165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.272497" }, { "step": 386, "loss": 1.0689376592636108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.402210" }, { "step": 387, "loss": 0.6899427771568298, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.487825" }, { "step": 388, "loss": 0.7299132347106934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.587407" }, { "step": 389, "loss": 0.7541588544845581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.677359" }, { "step": 390, "loss": 0.7740375399589539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.799400" }, { "step": 391, "loss": 0.9142655730247498, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.896831" }, { "step": 392, "loss": 0.7508710026741028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:37.992263" }, { "step": 393, "loss": 0.6070233583450317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.079975" }, { "step": 394, "loss": 1.204479694366455, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.206294" }, { "step": 395, "loss": 0.8948452472686768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.299102" }, { "step": 396, "loss": 0.9227185249328613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.391182" }, { "step": 397, "loss": 0.6877582669258118, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.482941" }, { "step": 398, "loss": 0.884697675704956, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.576382" }, { "step": 399, "loss": 1.1973178386688232, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.661309" }, { "step": 400, "loss": 0.6780576705932617, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.749554" }, { "step": 401, "loss": 1.1080093383789062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.836732" }, { "step": 402, "loss": 0.8101420402526855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:38.934446" }, { "step": 403, "loss": 0.773280918598175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.021459" }, { "step": 404, "loss": 0.8535457849502563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.108070" }, { "step": 405, "loss": 1.2719215154647827, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.195455" }, { "step": 406, "loss": 1.1348247528076172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.289099" }, { "step": 407, "loss": 0.8661947250366211, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.378190" }, { "step": 408, "loss": 0.9036744236946106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.463398" }, { "step": 409, "loss": 0.838208794593811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.548299" }, { "step": 410, "loss": 0.9179588556289673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.671142" }, { "step": 411, "loss": 1.0539608001708984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.757012" }, { "step": 412, "loss": 0.7337026596069336, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.844748" }, { "step": 413, "loss": 0.7482527494430542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:39.942911" }, { "step": 414, "loss": 0.6325270533561707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.034700" }, { "step": 415, "loss": 1.0214309692382812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.120533" }, { "step": 416, "loss": 0.8690586090087891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.232945" }, { "step": 417, "loss": 0.9112792611122131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.330907" }, { "step": 418, "loss": 0.9991483688354492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.415463" }, { "step": 419, "loss": 1.0035390853881836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.529387" }, { "step": 420, "loss": 0.8882923126220703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.615289" }, { "step": 421, "loss": 0.7913491129875183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.704464" }, { "step": 422, "loss": 1.1882169246673584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.789117" }, { "step": 423, "loss": 1.0074620246887207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:40.914909" }, { "step": 424, "loss": 0.8552249670028687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.032778" }, { "step": 425, "loss": 0.8104555606842041, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.146465" }, { "step": 426, "loss": 0.6600808501243591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.236225" }, { "step": 427, "loss": 1.316282033920288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.319868" }, { "step": 428, "loss": 0.9039617776870728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.406749" }, { "step": 429, "loss": 0.729335606098175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.504486" }, { "step": 430, "loss": 0.9095984697341919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.590087" }, { "step": 431, "loss": 1.2311749458312988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.709262" }, { "step": 432, "loss": 0.7047393321990967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.797784" }, { "step": 433, "loss": 1.059227705001831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:41.907848" }, { "step": 434, "loss": 1.319867491722107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.000403" }, { "step": 435, "loss": 0.5512518286705017, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.086034" }, { "step": 436, "loss": 0.5026146173477173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.173900" }, { "step": 437, "loss": 0.7653348445892334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.265442" }, { "step": 438, "loss": 0.9584765434265137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.354168" }, { "step": 439, "loss": 0.9230166673660278, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.438405" }, { "step": 440, "loss": 1.2503669261932373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.564689" }, { "step": 441, "loss": 0.9432649612426758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.655322" }, { "step": 442, "loss": 0.8798277378082275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.742167" }, { "step": 443, "loss": 0.6428899765014648, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.839266" }, { "step": 444, "loss": 0.8464118242263794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:42.925674" }, { "step": 445, "loss": 0.58531254529953, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.016932" }, { "step": 446, "loss": 0.3662051558494568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.108139" }, { "step": 447, "loss": 1.0588213205337524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.203286" }, { "step": 448, "loss": 1.1201095581054688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.318213" }, { "step": 449, "loss": 0.8565226793289185, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.430844" }, { "step": 450, "loss": 0.8522786498069763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.522358" }, { "step": 451, "loss": 0.8746011257171631, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.629671" }, { "step": 452, "loss": 1.0677416324615479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.718590" }, { "step": 453, "loss": 0.9620256423950195, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.811241" }, { "step": 454, "loss": 0.7626394033432007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.902468" }, { "step": 455, "loss": 0.8417598009109497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:43.993192" }, { "step": 456, "loss": 1.1507905721664429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.106571" }, { "step": 457, "loss": 1.1296881437301636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.222591" }, { "step": 458, "loss": 0.8800339102745056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.315683" }, { "step": 459, "loss": 0.8326114416122437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.431037" }, { "step": 460, "loss": 0.7486791610717773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.523134" }, { "step": 461, "loss": 1.231128215789795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.635995" }, { "step": 462, "loss": 0.944777250289917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.759181" }, { "step": 463, "loss": 0.9935376644134521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.852190" }, { "step": 464, "loss": 1.0805580615997314, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:44.953362" }, { "step": 465, "loss": 0.9056864976882935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.036979" }, { "step": 466, "loss": 0.6823549270629883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.134737" }, { "step": 467, "loss": 0.7081266641616821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.225891" }, { "step": 468, "loss": 0.9259730577468872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.313568" }, { "step": 469, "loss": 1.0057159662246704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.398536" }, { "step": 470, "loss": 0.9501736164093018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.485205" }, { "step": 471, "loss": 0.7312370538711548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.581948" }, { "step": 472, "loss": 0.7402532696723938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.700711" }, { "step": 473, "loss": 0.8168851137161255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.792639" }, { "step": 474, "loss": 0.9470968246459961, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:45.903921" }, { "step": 475, "loss": 1.1195228099822998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.019986" }, { "step": 476, "loss": 0.9236838817596436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.104903" }, { "step": 477, "loss": 1.1218373775482178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.237755" }, { "step": 478, "loss": 1.21327805519104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.354283" }, { "step": 479, "loss": 0.6653346419334412, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.444936" }, { "step": 480, "loss": 0.7336678504943848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.536626" }, { "step": 481, "loss": 0.8088697195053101, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.630099" }, { "step": 482, "loss": 1.1593656539916992, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.751982" }, { "step": 483, "loss": 0.8096703886985779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.836952" }, { "step": 484, "loss": 0.8816382884979248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:46.929588" }, { "step": 485, "loss": 0.6060751676559448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.025872" }, { "step": 486, "loss": 0.896709680557251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.116285" }, { "step": 487, "loss": 0.7773913145065308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.210655" }, { "step": 488, "loss": 1.2889087200164795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.295090" }, { "step": 489, "loss": 0.9140845537185669, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.428624" }, { "step": 490, "loss": 0.6206951141357422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.516568" }, { "step": 491, "loss": 0.7009551525115967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.616145" }, { "step": 492, "loss": 0.8614954948425293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.703331" }, { "step": 493, "loss": 0.563684344291687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.800544" }, { "step": 494, "loss": 0.9608831405639648, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:47.885945" }, { "step": 495, "loss": 1.1308081150054932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:48.010733" }, { "step": 496, "loss": 1.1646283864974976, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:48.105685" }, { "step": 497, "loss": 1.0601484775543213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:48.198446" }, { "step": 498, "loss": 0.7879912257194519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:48.283158" }, { "step": 499, "loss": 0.943706750869751, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:48.369607" }, { "step": 500, "loss": 0.9561386108398438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:23:48.463008" }, { "step": 501, "loss": 0.8832870721817017, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.262906" }, { "step": 502, "loss": 0.8614141941070557, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.365428" }, { "step": 503, "loss": 0.7987558245658875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.461633" }, { "step": 504, "loss": 1.0324549674987793, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.576162" }, { "step": 505, "loss": 0.9854774475097656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.676235" }, { "step": 506, "loss": 0.7400413155555725, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.761779" }, { "step": 507, "loss": 1.0634453296661377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.858748" }, { "step": 508, "loss": 1.0954358577728271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:11.951165" }, { "step": 509, "loss": 0.7309540510177612, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.045369" }, { "step": 510, "loss": 0.7491720914840698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.135055" }, { "step": 511, "loss": 0.8831789493560791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.219262" }, { "step": 512, "loss": 0.8217372894287109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.305280" }, { "step": 513, "loss": 1.0742322206497192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.399636" }, { "step": 514, "loss": 0.716166615486145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.489148" }, { "step": 515, "loss": 1.146081805229187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.608082" }, { "step": 516, "loss": 0.8536627292633057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.699152" }, { "step": 517, "loss": 0.9283041954040527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.786199" }, { "step": 518, "loss": 0.9304966926574707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.875226" }, { "step": 519, "loss": 1.2809308767318726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:12.964904" }, { "step": 520, "loss": 0.6101891994476318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.071545" }, { "step": 521, "loss": 0.9347330927848816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.165130" }, { "step": 522, "loss": 0.6337159276008606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.254736" }, { "step": 523, "loss": 1.0832293033599854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.364310" }, { "step": 524, "loss": 0.8452403545379639, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.459247" }, { "step": 525, "loss": 0.982178807258606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.554323" }, { "step": 526, "loss": 0.6512837409973145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.657121" }, { "step": 527, "loss": 1.3843578100204468, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.744062" }, { "step": 528, "loss": 0.8656461238861084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.831357" }, { "step": 529, "loss": 0.9735211133956909, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:13.916616" }, { "step": 530, "loss": 0.9993297457695007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.009404" }, { "step": 531, "loss": 0.9843109250068665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.101854" }, { "step": 532, "loss": 1.0474947690963745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.191065" }, { "step": 533, "loss": 0.5618821382522583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.278988" }, { "step": 534, "loss": 1.0090460777282715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.367018" }, { "step": 535, "loss": 1.1607697010040283, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.464969" }, { "step": 536, "loss": 1.2201876640319824, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.555196" }, { "step": 537, "loss": 0.8878445625305176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.653999" }, { "step": 538, "loss": 0.6891810894012451, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.743608" }, { "step": 539, "loss": 0.85243821144104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.834301" }, { "step": 540, "loss": 0.8087791800498962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:14.931153" }, { "step": 541, "loss": 0.7120470404624939, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.032537" }, { "step": 542, "loss": 1.0121769905090332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.142862" }, { "step": 543, "loss": 0.5740492939949036, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.229992" }, { "step": 544, "loss": 1.166844129562378, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.317685" }, { "step": 545, "loss": 1.0672228336334229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.431987" }, { "step": 546, "loss": 0.7389703392982483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.533252" }, { "step": 547, "loss": 1.0855716466903687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.645335" }, { "step": 548, "loss": 0.7042009830474854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.732572" }, { "step": 549, "loss": 1.1004143953323364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.849309" }, { "step": 550, "loss": 1.068941593170166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:15.934231" }, { "step": 551, "loss": 0.7473564147949219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.019436" }, { "step": 552, "loss": 1.0405232906341553, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.111474" }, { "step": 553, "loss": 0.8828482627868652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.204270" }, { "step": 554, "loss": 0.6712629199028015, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.299118" }, { "step": 555, "loss": 0.9776933193206787, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.385763" }, { "step": 556, "loss": 1.059738278388977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.500632" }, { "step": 557, "loss": 1.1276445388793945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.614386" }, { "step": 558, "loss": 0.5439015626907349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.713865" }, { "step": 559, "loss": 0.9748817682266235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.832172" }, { "step": 560, "loss": 0.7483049631118774, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:16.933308" }, { "step": 561, "loss": 0.7872772216796875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.021276" }, { "step": 562, "loss": 1.0594642162322998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.114484" }, { "step": 563, "loss": 0.9832146167755127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.207928" }, { "step": 564, "loss": 0.7043198347091675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.292734" }, { "step": 565, "loss": 0.9533512592315674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.410339" }, { "step": 566, "loss": 0.7111992835998535, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.501482" }, { "step": 567, "loss": 0.949575662612915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.612779" }, { "step": 568, "loss": 1.1394915580749512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.697756" }, { "step": 569, "loss": 1.0161248445510864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.785518" }, { "step": 570, "loss": 1.0409795045852661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:17.915460" }, { "step": 571, "loss": 0.8805245161056519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.006989" }, { "step": 572, "loss": 0.8704512119293213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.105518" }, { "step": 573, "loss": 0.5598913431167603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.190775" }, { "step": 574, "loss": 0.8058819770812988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.290981" }, { "step": 575, "loss": 0.8740168809890747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.381248" }, { "step": 576, "loss": 0.6787643432617188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.474982" }, { "step": 577, "loss": 0.9914801120758057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.563544" }, { "step": 578, "loss": 0.537498950958252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.648669" }, { "step": 579, "loss": 1.00816011428833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.789839" }, { "step": 580, "loss": 0.7377841472625732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.876263" }, { "step": 581, "loss": 1.0015766620635986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:18.962507" }, { "step": 582, "loss": 0.7288545370101929, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.064024" }, { "step": 583, "loss": 0.8286885023117065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.185123" }, { "step": 584, "loss": 0.7355365753173828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.276259" }, { "step": 585, "loss": 1.0190036296844482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.369024" }, { "step": 586, "loss": 0.7989758253097534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.460577" }, { "step": 587, "loss": 1.3194202184677124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.552489" }, { "step": 588, "loss": 0.6123311519622803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.644737" }, { "step": 589, "loss": 0.9219006299972534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.759644" }, { "step": 590, "loss": 1.108147144317627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.883203" }, { "step": 591, "loss": 1.2147467136383057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:19.973767" }, { "step": 592, "loss": 0.77805495262146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.078888" }, { "step": 593, "loss": 1.2259743213653564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.201516" }, { "step": 594, "loss": 0.773209810256958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.295888" }, { "step": 595, "loss": 0.7093479633331299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.382732" }, { "step": 596, "loss": 0.9244993329048157, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.471398" }, { "step": 597, "loss": 1.0217846632003784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.563201" }, { "step": 598, "loss": 0.862676203250885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.660606" }, { "step": 599, "loss": 0.521963357925415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.746453" }, { "step": 600, "loss": 0.6976065635681152, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.844865" }, { "step": 601, "loss": 0.8973067998886108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:20.933075" }, { "step": 602, "loss": 0.8826678991317749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.056681" }, { "step": 603, "loss": 1.0947035551071167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.180480" }, { "step": 604, "loss": 0.7709010243415833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.281746" }, { "step": 605, "loss": 1.0213173627853394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.373101" }, { "step": 606, "loss": 0.8142729997634888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.466574" }, { "step": 607, "loss": 1.0851343870162964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.564172" }, { "step": 608, "loss": 1.0709824562072754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.656568" }, { "step": 609, "loss": 0.9929410219192505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.753964" }, { "step": 610, "loss": 0.7767935991287231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.838032" }, { "step": 611, "loss": 1.1285254955291748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:21.952508" }, { "step": 612, "loss": 0.6442114114761353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.039514" }, { "step": 613, "loss": 0.9082322120666504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.139610" }, { "step": 614, "loss": 0.8053550124168396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.235736" }, { "step": 615, "loss": 0.8365138173103333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.321900" }, { "step": 616, "loss": 0.8731719255447388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.445276" }, { "step": 617, "loss": 1.0733591318130493, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.533990" }, { "step": 618, "loss": 1.151520013809204, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.634230" }, { "step": 619, "loss": 0.6450933218002319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.735483" }, { "step": 620, "loss": 1.061762809753418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.819787" }, { "step": 621, "loss": 0.8897079229354858, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.905201" }, { "step": 622, "loss": 1.1165064573287964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:22.991392" }, { "step": 623, "loss": 0.8433017730712891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.076451" }, { "step": 624, "loss": 0.8309490084648132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.166609" }, { "step": 625, "loss": 0.9169985055923462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.265731" }, { "step": 626, "loss": 0.9625258445739746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.361228" }, { "step": 627, "loss": 0.6397137641906738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.452935" }, { "step": 628, "loss": 0.9055684208869934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.539312" }, { "step": 629, "loss": 0.6585572957992554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.632984" }, { "step": 630, "loss": 0.972169816493988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.742130" }, { "step": 631, "loss": 0.5203886032104492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.830473" }, { "step": 632, "loss": 0.7756165266036987, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:23.930685" }, { "step": 633, "loss": 0.6674431562423706, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.014093" }, { "step": 634, "loss": 0.5377005338668823, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.100206" }, { "step": 635, "loss": 0.8013380765914917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.196080" }, { "step": 636, "loss": 0.8359743356704712, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.290727" }, { "step": 637, "loss": 0.8492889404296875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.385261" }, { "step": 638, "loss": 0.9855073690414429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.479891" }, { "step": 639, "loss": 0.8762567639350891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.573516" }, { "step": 640, "loss": 1.0613601207733154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.663669" }, { "step": 641, "loss": 0.6265792846679688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.755899" }, { "step": 642, "loss": 1.116650104522705, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.874505" }, { "step": 643, "loss": 0.661430299282074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:24.966958" }, { "step": 644, "loss": 1.0431841611862183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.067909" }, { "step": 645, "loss": 0.798627495765686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.191190" }, { "step": 646, "loss": 1.0178494453430176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.275548" }, { "step": 647, "loss": 0.5732675790786743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.367548" }, { "step": 648, "loss": 1.0109878778457642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.454314" }, { "step": 649, "loss": 1.1108477115631104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.541150" }, { "step": 650, "loss": 0.8398318290710449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.630899" }, { "step": 651, "loss": 0.6946483254432678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.715570" }, { "step": 652, "loss": 1.240126371383667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.837170" }, { "step": 653, "loss": 0.5139456987380981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:25.929993" }, { "step": 654, "loss": 0.5992851257324219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.022728" }, { "step": 655, "loss": 0.7991337180137634, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.108182" }, { "step": 656, "loss": 0.3652641177177429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.201551" }, { "step": 657, "loss": 0.5388368368148804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.288849" }, { "step": 658, "loss": 0.7613836526870728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.380213" }, { "step": 659, "loss": 0.8513718843460083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.483623" }, { "step": 660, "loss": 0.6463839411735535, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.570224" }, { "step": 661, "loss": 0.7910126447677612, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.669217" }, { "step": 662, "loss": 0.8002768754959106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.760471" }, { "step": 663, "loss": 1.1216663122177124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.879304" }, { "step": 664, "loss": 0.7329313158988953, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:26.977956" }, { "step": 665, "loss": 0.8241696357727051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.077471" }, { "step": 666, "loss": 1.3708162307739258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.166898" }, { "step": 667, "loss": 0.8733571767807007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.262325" }, { "step": 668, "loss": 0.9484143257141113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.350662" }, { "step": 669, "loss": 0.46131670475006104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.440915" }, { "step": 670, "loss": 0.9065471887588501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.528671" }, { "step": 671, "loss": 0.8836148381233215, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.612205" }, { "step": 672, "loss": 0.8271085023880005, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.703638" }, { "step": 673, "loss": 0.9083006381988525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.795634" }, { "step": 674, "loss": 0.8741034269332886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.881904" }, { "step": 675, "loss": 0.7223389148712158, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:27.968539" }, { "step": 676, "loss": 1.4963951110839844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.061031" }, { "step": 677, "loss": 1.0274271965026855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.184329" }, { "step": 678, "loss": 0.744950532913208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.275502" }, { "step": 679, "loss": 0.9222225546836853, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.360837" }, { "step": 680, "loss": 0.9042009115219116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.472363" }, { "step": 681, "loss": 0.583402156829834, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.565678" }, { "step": 682, "loss": 0.7606973648071289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.650671" }, { "step": 683, "loss": 0.583808183670044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.735809" }, { "step": 684, "loss": 0.695250391960144, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.833289" }, { "step": 685, "loss": 0.8879551291465759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:28.926486" }, { "step": 686, "loss": 0.9738034009933472, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.010356" }, { "step": 687, "loss": 0.8030788898468018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.102089" }, { "step": 688, "loss": 0.7668824791908264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.204460" }, { "step": 689, "loss": 1.01244056224823, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.317137" }, { "step": 690, "loss": 0.9859507083892822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.405072" }, { "step": 691, "loss": 1.1238012313842773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.544069" }, { "step": 692, "loss": 0.872995913028717, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.663605" }, { "step": 693, "loss": 1.2703293561935425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.749436" }, { "step": 694, "loss": 0.7866307497024536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.850859" }, { "step": 695, "loss": 0.8361921310424805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:29.947952" }, { "step": 696, "loss": 0.8845713138580322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.040617" }, { "step": 697, "loss": 0.9008805751800537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.133287" }, { "step": 698, "loss": 0.9516750574111938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.227492" }, { "step": 699, "loss": 0.9175969362258911, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.320960" }, { "step": 700, "loss": 0.7831265926361084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.410766" }, { "step": 701, "loss": 0.8964943885803223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.552400" }, { "step": 702, "loss": 0.5136051177978516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.655547" }, { "step": 703, "loss": 0.8515502214431763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.747002" }, { "step": 704, "loss": 0.7020877599716187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.832686" }, { "step": 705, "loss": 0.9811851978302002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:30.925314" }, { "step": 706, "loss": 0.8338496685028076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.024062" }, { "step": 707, "loss": 0.5083923935890198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.109980" }, { "step": 708, "loss": 1.0611273050308228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.205530" }, { "step": 709, "loss": 0.7003802061080933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.310047" }, { "step": 710, "loss": 0.7486763000488281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.409394" }, { "step": 711, "loss": 1.1283022165298462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.496627" }, { "step": 712, "loss": 1.1055413484573364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.648289" }, { "step": 713, "loss": 1.066116452217102, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.764066" }, { "step": 714, "loss": 0.8267605304718018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.856954" }, { "step": 715, "loss": 0.8945412635803223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:31.955825" }, { "step": 716, "loss": 1.061569333076477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.053857" }, { "step": 717, "loss": 0.8763951063156128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.162743" }, { "step": 718, "loss": 0.7545145750045776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.270448" }, { "step": 719, "loss": 0.6093243360519409, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.367066" }, { "step": 720, "loss": 1.1344761848449707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.477460" }, { "step": 721, "loss": 0.6900872588157654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.566035" }, { "step": 722, "loss": 0.8812373876571655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.657675" }, { "step": 723, "loss": 1.18498694896698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.770046" }, { "step": 724, "loss": 0.5833555459976196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.856378" }, { "step": 725, "loss": 0.9139548540115356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:32.953886" }, { "step": 726, "loss": 0.9359950423240662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.039690" }, { "step": 727, "loss": 0.9409313201904297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.132645" }, { "step": 728, "loss": 0.676138162612915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.229833" }, { "step": 729, "loss": 0.6856882572174072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.323817" }, { "step": 730, "loss": 1.0773696899414062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.417360" }, { "step": 731, "loss": 1.0915865898132324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.506041" }, { "step": 732, "loss": 0.9267287850379944, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.600088" }, { "step": 733, "loss": 0.8584641218185425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.691448" }, { "step": 734, "loss": 0.6938006281852722, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:33.931523" }, { "step": 735, "loss": 1.0148556232452393, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.021327" }, { "step": 736, "loss": 1.1910054683685303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.133319" }, { "step": 737, "loss": 0.9798187017440796, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.227719" }, { "step": 738, "loss": 0.669413685798645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.331535" }, { "step": 739, "loss": 0.7706905603408813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.426310" }, { "step": 740, "loss": 0.8088266253471375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.543543" }, { "step": 741, "loss": 0.7302885055541992, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.642409" }, { "step": 742, "loss": 1.1155155897140503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.732576" }, { "step": 743, "loss": 0.30197444558143616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.819648" }, { "step": 744, "loss": 0.984937310218811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:34.920003" }, { "step": 745, "loss": 0.8381345272064209, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.004843" }, { "step": 746, "loss": 0.8607252836227417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.100260" }, { "step": 747, "loss": 0.813067615032196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.186042" }, { "step": 748, "loss": 0.8455133438110352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.279806" }, { "step": 749, "loss": 0.8631391525268555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.373916" }, { "step": 750, "loss": 0.8824008107185364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.466979" }, { "step": 751, "loss": 0.8955533504486084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.553086" }, { "step": 752, "loss": 0.9780110716819763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.640881" }, { "step": 753, "loss": 0.7948328256607056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.725795" }, { "step": 754, "loss": 0.8393138647079468, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.836880" }, { "step": 755, "loss": 0.9315209984779358, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:35.950058" }, { "step": 756, "loss": 0.6848862171173096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.046565" }, { "step": 757, "loss": 0.747799813747406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.142152" }, { "step": 758, "loss": 0.9372379183769226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.228238" }, { "step": 759, "loss": 0.9743911027908325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.336043" }, { "step": 760, "loss": 0.7758783102035522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.425454" }, { "step": 761, "loss": 0.957741379737854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.520890" }, { "step": 762, "loss": 0.730352520942688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.620658" }, { "step": 763, "loss": 1.0826396942138672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.736699" }, { "step": 764, "loss": 0.8350582122802734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.820929" }, { "step": 765, "loss": 1.0187363624572754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:36.934345" }, { "step": 766, "loss": 1.0943995714187622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.025386" }, { "step": 767, "loss": 1.1965428590774536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.160388" }, { "step": 768, "loss": 0.7461786270141602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.277544" }, { "step": 769, "loss": 0.8615906238555908, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.386540" }, { "step": 770, "loss": 1.5781065225601196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.471921" }, { "step": 771, "loss": 0.6872075796127319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.562698" }, { "step": 772, "loss": 0.7841407060623169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.649023" }, { "step": 773, "loss": 0.7616927623748779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.739735" }, { "step": 774, "loss": 0.798783540725708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.824810" }, { "step": 775, "loss": 0.9298352003097534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:37.958926" }, { "step": 776, "loss": 0.7622988224029541, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.075090" }, { "step": 777, "loss": 0.8714120388031006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.179194" }, { "step": 778, "loss": 0.6416409611701965, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.279058" }, { "step": 779, "loss": 0.8596643209457397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.370564" }, { "step": 780, "loss": 0.8863228559494019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.456191" }, { "step": 781, "loss": 1.041957139968872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.550285" }, { "step": 782, "loss": 0.7969785928726196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.641669" }, { "step": 783, "loss": 1.112534999847412, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.731699" }, { "step": 784, "loss": 0.9823282957077026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.816698" }, { "step": 785, "loss": 0.39879417419433594, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.901469" }, { "step": 786, "loss": 0.8305615186691284, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:38.987229" }, { "step": 787, "loss": 0.4936663508415222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.073113" }, { "step": 788, "loss": 0.9185281991958618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.208385" }, { "step": 789, "loss": 0.6829924583435059, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.305448" }, { "step": 790, "loss": 1.0110011100769043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.396003" }, { "step": 791, "loss": 0.7814629673957825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.480266" }, { "step": 792, "loss": 0.5811723470687866, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.573799" }, { "step": 793, "loss": 0.5993483662605286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.667406" }, { "step": 794, "loss": 0.697442889213562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.758731" }, { "step": 795, "loss": 0.896669864654541, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.872628" }, { "step": 796, "loss": 0.7674007415771484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:39.983836" }, { "step": 797, "loss": 0.9166538715362549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.075045" }, { "step": 798, "loss": 1.0593212842941284, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.200934" }, { "step": 799, "loss": 0.8726993799209595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.317616" }, { "step": 800, "loss": 0.6590849161148071, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.417758" }, { "step": 801, "loss": 0.846345067024231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.511562" }, { "step": 802, "loss": 0.7135627269744873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.608696" }, { "step": 803, "loss": 0.7592572569847107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.701947" }, { "step": 804, "loss": 1.1060441732406616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.812527" }, { "step": 805, "loss": 0.7281088829040527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:40.907647" }, { "step": 806, "loss": 0.8787092566490173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.025685" }, { "step": 807, "loss": 0.6509213447570801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.124289" }, { "step": 808, "loss": 1.037445306777954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.218596" }, { "step": 809, "loss": 0.7524062395095825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.314693" }, { "step": 810, "loss": 1.0077239274978638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.404751" }, { "step": 811, "loss": 0.9738563299179077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.490184" }, { "step": 812, "loss": 0.9002560377120972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.609549" }, { "step": 813, "loss": 0.8296515345573425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.698313" }, { "step": 814, "loss": 0.770193874835968, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.790491" }, { "step": 815, "loss": 0.8621568083763123, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.874556" }, { "step": 816, "loss": 0.6938713192939758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:41.963940" }, { "step": 817, "loss": 0.7561683058738708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.056349" }, { "step": 818, "loss": 0.8402175903320312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.165503" }, { "step": 819, "loss": 0.6871495246887207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.264577" }, { "step": 820, "loss": 1.072792649269104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.352669" }, { "step": 821, "loss": 0.7718715071678162, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.451864" }, { "step": 822, "loss": 0.6868950128555298, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.537122" }, { "step": 823, "loss": 0.6652205586433411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.629543" }, { "step": 824, "loss": 0.7605710029602051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.723944" }, { "step": 825, "loss": 0.7195290923118591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.816341" }, { "step": 826, "loss": 0.7403081655502319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.908807" }, { "step": 827, "loss": 0.784052312374115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:42.996253" }, { "step": 828, "loss": 1.1284081935882568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.121629" }, { "step": 829, "loss": 0.5696630477905273, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.221038" }, { "step": 830, "loss": 0.7261099815368652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.312680" }, { "step": 831, "loss": 0.9081183671951294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.411803" }, { "step": 832, "loss": 0.8278322219848633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.509589" }, { "step": 833, "loss": 0.6707237958908081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.593833" }, { "step": 834, "loss": 0.9572373628616333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.686717" }, { "step": 835, "loss": 0.6405086517333984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.773254" }, { "step": 836, "loss": 0.9237533807754517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.888305" }, { "step": 837, "loss": 0.8497680425643921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:43.982101" }, { "step": 838, "loss": 0.6642113924026489, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.072126" }, { "step": 839, "loss": 0.5213629603385925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.165468" }, { "step": 840, "loss": 1.106764793395996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.249106" }, { "step": 841, "loss": 0.9231554269790649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.342913" }, { "step": 842, "loss": 0.8193601965904236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.438867" }, { "step": 843, "loss": 0.6418062448501587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.531733" }, { "step": 844, "loss": 1.0514140129089355, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.648268" }, { "step": 845, "loss": 0.6502397060394287, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.735660" }, { "step": 846, "loss": 0.5613604784011841, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.820864" }, { "step": 847, "loss": 0.5667914152145386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:44.920157" }, { "step": 848, "loss": 0.9573049545288086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.016942" }, { "step": 849, "loss": 0.763053297996521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.104749" }, { "step": 850, "loss": 0.5323175191879272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.193566" }, { "step": 851, "loss": 0.7126999497413635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.285738" }, { "step": 852, "loss": 1.175980806350708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.395827" }, { "step": 853, "loss": 1.1283702850341797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.493520" }, { "step": 854, "loss": 0.7567734718322754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.586734" }, { "step": 855, "loss": 0.5159550905227661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.674130" }, { "step": 856, "loss": 0.9190926551818848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.790764" }, { "step": 857, "loss": 1.04990553855896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.888333" }, { "step": 858, "loss": 0.6491147875785828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:45.978006" }, { "step": 859, "loss": 0.7162141799926758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.062614" }, { "step": 860, "loss": 0.8474727869033813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.161535" }, { "step": 861, "loss": 1.0896774530410767, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.270612" }, { "step": 862, "loss": 0.7819879651069641, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.357722" }, { "step": 863, "loss": 0.9761104583740234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.443743" }, { "step": 864, "loss": 0.5577294826507568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.535081" }, { "step": 865, "loss": 0.8035650253295898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.621256" }, { "step": 866, "loss": 1.0466394424438477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.740177" }, { "step": 867, "loss": 1.1098616123199463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.825643" }, { "step": 868, "loss": 0.7368583083152771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:46.937065" }, { "step": 869, "loss": 0.5674487352371216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.030775" }, { "step": 870, "loss": 0.8945719003677368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.149263" }, { "step": 871, "loss": 0.9351997375488281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.236417" }, { "step": 872, "loss": 0.5319985151290894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.335375" }, { "step": 873, "loss": 0.5695075392723083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.428645" }, { "step": 874, "loss": 1.0491480827331543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.537998" }, { "step": 875, "loss": 0.6615697741508484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.639389" }, { "step": 876, "loss": 0.9285553693771362, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.755511" }, { "step": 877, "loss": 0.9260551333427429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.846958" }, { "step": 878, "loss": 0.9904400110244751, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:47.935686" }, { "step": 879, "loss": 0.6255174875259399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.020876" }, { "step": 880, "loss": 0.8683861494064331, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.107746" }, { "step": 881, "loss": 1.0783017873764038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.206989" }, { "step": 882, "loss": 1.1838805675506592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.324207" }, { "step": 883, "loss": 0.8093264102935791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.409558" }, { "step": 884, "loss": 0.994838535785675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.510412" }, { "step": 885, "loss": 0.6557358503341675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.604686" }, { "step": 886, "loss": 0.7079113721847534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.723610" }, { "step": 887, "loss": 1.2648265361785889, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.811059" }, { "step": 888, "loss": 1.0066027641296387, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:48.958476" }, { "step": 889, "loss": 1.1107677221298218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.042972" }, { "step": 890, "loss": 0.8340119123458862, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.165307" }, { "step": 891, "loss": 0.6687378287315369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.266539" }, { "step": 892, "loss": 0.5253347158432007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.354936" }, { "step": 893, "loss": 0.7432320713996887, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.439662" }, { "step": 894, "loss": 0.8976137638092041, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.531331" }, { "step": 895, "loss": 0.9489121437072754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.622989" }, { "step": 896, "loss": 0.6105759143829346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.714589" }, { "step": 897, "loss": 0.8804389238357544, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.803794" }, { "step": 898, "loss": 0.7230123281478882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:49.900872" }, { "step": 899, "loss": 0.6726154685020447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.013640" }, { "step": 900, "loss": 0.5970502495765686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.110851" }, { "step": 901, "loss": 1.0122264623641968, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.202263" }, { "step": 902, "loss": 0.7754744291305542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.294082" }, { "step": 903, "loss": 0.5965988636016846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.379155" }, { "step": 904, "loss": 0.9235401153564453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.499418" }, { "step": 905, "loss": 1.3013359308242798, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.587016" }, { "step": 906, "loss": 0.9844444990158081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.684672" }, { "step": 907, "loss": 1.0938267707824707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.769910" }, { "step": 908, "loss": 0.719542384147644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.880638" }, { "step": 909, "loss": 0.612686812877655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:50.978630" }, { "step": 910, "loss": 1.0123183727264404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.093182" }, { "step": 911, "loss": 0.8186390399932861, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.204430" }, { "step": 912, "loss": 0.569892168045044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.287101" }, { "step": 913, "loss": 0.6012465357780457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.372794" }, { "step": 914, "loss": 0.6023882627487183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.467748" }, { "step": 915, "loss": 0.8663707971572876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.592117" }, { "step": 916, "loss": 0.8780674338340759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.681221" }, { "step": 917, "loss": 0.7721043825149536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.766646" }, { "step": 918, "loss": 0.8170303106307983, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.853569" }, { "step": 919, "loss": 0.894187867641449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:51.943282" }, { "step": 920, "loss": 1.0443658828735352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.075345" }, { "step": 921, "loss": 0.8683757185935974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.172824" }, { "step": 922, "loss": 0.9332163333892822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.274743" }, { "step": 923, "loss": 1.137658715248108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.364231" }, { "step": 924, "loss": 1.1167747974395752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.509170" }, { "step": 925, "loss": 0.6338979005813599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.604590" }, { "step": 926, "loss": 0.7975009679794312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.700164" }, { "step": 927, "loss": 0.9493435621261597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.821708" }, { "step": 928, "loss": 0.5481773018836975, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:52.911196" }, { "step": 929, "loss": 0.9977529048919678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.023811" }, { "step": 930, "loss": 0.8228853940963745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.113862" }, { "step": 931, "loss": 1.1117947101593018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.203337" }, { "step": 932, "loss": 0.8600997924804688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.299455" }, { "step": 933, "loss": 1.0831177234649658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.397536" }, { "step": 934, "loss": 0.989351749420166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.484735" }, { "step": 935, "loss": 0.8009433746337891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.570619" }, { "step": 936, "loss": 0.799956202507019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.654592" }, { "step": 937, "loss": 0.7885302305221558, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.757769" }, { "step": 938, "loss": 0.6349055767059326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.858537" }, { "step": 939, "loss": 0.713094174861908, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:53.943162" }, { "step": 940, "loss": 0.9391717910766602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.034711" }, { "step": 941, "loss": 0.43561673164367676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.126796" }, { "step": 942, "loss": 1.15494704246521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.212386" }, { "step": 943, "loss": 1.101219654083252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.321511" }, { "step": 944, "loss": 1.093763828277588, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.443346" }, { "step": 945, "loss": 1.2654218673706055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.536272" }, { "step": 946, "loss": 0.7692990303039551, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.620321" }, { "step": 947, "loss": 0.7055923938751221, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.706121" }, { "step": 948, "loss": 0.7739092707633972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.796455" }, { "step": 949, "loss": 0.5255370736122131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.888891" }, { "step": 950, "loss": 0.642512321472168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:54.982891" }, { "step": 951, "loss": 0.8723102807998657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.099874" }, { "step": 952, "loss": 0.9509286880493164, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.192826" }, { "step": 953, "loss": 0.6407347917556763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.283261" }, { "step": 954, "loss": 0.7975196242332458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.375937" }, { "step": 955, "loss": 0.6332718133926392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.468446" }, { "step": 956, "loss": 0.737233579158783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.559957" }, { "step": 957, "loss": 1.0208401679992676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.674746" }, { "step": 958, "loss": 1.0235768556594849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.779152" }, { "step": 959, "loss": 1.0259186029434204, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.864542" }, { "step": 960, "loss": 0.8962245583534241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:55.953118" }, { "step": 961, "loss": 0.7522847652435303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.053426" }, { "step": 962, "loss": 0.8101009130477905, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.143339" }, { "step": 963, "loss": 0.7715305685997009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.235563" }, { "step": 964, "loss": 0.9338061809539795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.327791" }, { "step": 965, "loss": 1.0399634838104248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.464506" }, { "step": 966, "loss": 0.5123656988143921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.554255" }, { "step": 967, "loss": 0.7107004523277283, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.667312" }, { "step": 968, "loss": 0.5666841268539429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.753531" }, { "step": 969, "loss": 0.9610691666603088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.866236" }, { "step": 970, "loss": 1.0670411586761475, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:56.959932" }, { "step": 971, "loss": 0.5621532201766968, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.058341" }, { "step": 972, "loss": 0.5852326154708862, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.150613" }, { "step": 973, "loss": 0.7150869369506836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.267756" }, { "step": 974, "loss": 1.041925311088562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.353640" }, { "step": 975, "loss": 0.9414845705032349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.439597" }, { "step": 976, "loss": 0.6378811001777649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.527719" }, { "step": 977, "loss": 0.6231802701950073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.619957" }, { "step": 978, "loss": 0.9558529853820801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.708233" }, { "step": 979, "loss": 0.9441369771957397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.794291" }, { "step": 980, "loss": 1.131023645401001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.881033" }, { "step": 981, "loss": 0.9189444780349731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:57.978203" }, { "step": 982, "loss": 0.9463452100753784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.095562" }, { "step": 983, "loss": 0.8705431222915649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.185975" }, { "step": 984, "loss": 0.8644773960113525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.269902" }, { "step": 985, "loss": 0.7041594982147217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.365662" }, { "step": 986, "loss": 0.595238208770752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.451944" }, { "step": 987, "loss": 0.9648890495300293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.574834" }, { "step": 988, "loss": 0.5794085264205933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.673028" }, { "step": 989, "loss": 0.7614667415618896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.758812" }, { "step": 990, "loss": 1.1193681955337524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.856151" }, { "step": 991, "loss": 0.7818245887756348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:58.946607" }, { "step": 992, "loss": 0.939274787902832, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.032148" }, { "step": 993, "loss": 0.48655781149864197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.120980" }, { "step": 994, "loss": 0.6364926099777222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.217955" }, { "step": 995, "loss": 0.5788198113441467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.307564" }, { "step": 996, "loss": 0.7223525047302246, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.408483" }, { "step": 997, "loss": 0.6611890196800232, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.493177" }, { "step": 998, "loss": 0.7040435075759888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.579182" }, { "step": 999, "loss": 0.6256853342056274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.684198" }, { "step": 1000, "loss": 0.7186115980148315, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:24:59.768886" }, { "step": 1001, "loss": 0.795853316783905, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:22.450941" }, { "step": 1002, "loss": 0.7505607008934021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:22.545517" }, { "step": 1003, "loss": 0.7300190925598145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:22.639534" }, { "step": 1004, "loss": 0.9010558724403381, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:22.739421" }, { "step": 1005, "loss": 0.7855645418167114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:22.840430" }, { "step": 1006, "loss": 1.0798338651657104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:22.954992" }, { "step": 1007, "loss": 0.6218136548995972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.048228" }, { "step": 1008, "loss": 0.7417478561401367, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.133885" }, { "step": 1009, "loss": 0.9390134811401367, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.241676" }, { "step": 1010, "loss": 0.5621345639228821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.345892" }, { "step": 1011, "loss": 0.9872689247131348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.443825" }, { "step": 1012, "loss": 0.7719905376434326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.538073" }, { "step": 1013, "loss": 1.062432050704956, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.624813" }, { "step": 1014, "loss": 1.1068671941757202, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.746651" }, { "step": 1015, "loss": 0.7877939939498901, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.844590" }, { "step": 1016, "loss": 0.9201746582984924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:23.932881" }, { "step": 1017, "loss": 0.513413667678833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.021678" }, { "step": 1018, "loss": 0.6989449262619019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.125417" }, { "step": 1019, "loss": 0.7305814027786255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.216340" }, { "step": 1020, "loss": 0.7984755039215088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.301957" }, { "step": 1021, "loss": 0.8523383140563965, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.398840" }, { "step": 1022, "loss": 0.5797805190086365, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.490631" }, { "step": 1023, "loss": 0.909878671169281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.576062" }, { "step": 1024, "loss": 0.7937849760055542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.666832" }, { "step": 1025, "loss": 1.1374636888504028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.781630" }, { "step": 1026, "loss": 1.0318334102630615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.870695" }, { "step": 1027, "loss": 0.8786232471466064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:24.958408" }, { "step": 1028, "loss": 0.5576431155204773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.046309" }, { "step": 1029, "loss": 0.7726000547409058, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.136615" }, { "step": 1030, "loss": 0.6977241039276123, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.246415" }, { "step": 1031, "loss": 0.8847371339797974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.350554" }, { "step": 1032, "loss": 0.652221143245697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.437554" }, { "step": 1033, "loss": 0.7560689449310303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.538961" }, { "step": 1034, "loss": 0.7931987643241882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.628618" }, { "step": 1035, "loss": 0.7169964909553528, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.732929" }, { "step": 1036, "loss": 0.90721595287323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.818441" }, { "step": 1037, "loss": 0.8393386006355286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:25.941322" }, { "step": 1038, "loss": 0.8964701890945435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.032790" }, { "step": 1039, "loss": 0.6255829334259033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.145852" }, { "step": 1040, "loss": 0.8110803365707397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.241291" }, { "step": 1041, "loss": 0.6484652757644653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.333617" }, { "step": 1042, "loss": 0.9432436227798462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.420652" }, { "step": 1043, "loss": 0.7818832397460938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.512220" }, { "step": 1044, "loss": 0.5516683459281921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.603908" }, { "step": 1045, "loss": 0.9507326483726501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.720990" }, { "step": 1046, "loss": 1.00033700466156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.835235" }, { "step": 1047, "loss": 1.206046223640442, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:26.927808" }, { "step": 1048, "loss": 0.6940313577651978, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.047636" }, { "step": 1049, "loss": 1.0129690170288086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.159181" }, { "step": 1050, "loss": 0.9849637746810913, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.245798" }, { "step": 1051, "loss": 1.0722110271453857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.331882" }, { "step": 1052, "loss": 0.860036313533783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.424940" }, { "step": 1053, "loss": 0.9465929269790649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.535312" }, { "step": 1054, "loss": 0.9623941779136658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.646630" }, { "step": 1055, "loss": 0.37416765093803406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.733743" }, { "step": 1056, "loss": 0.715760350227356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.849760" }, { "step": 1057, "loss": 0.8895492553710938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:27.943198" }, { "step": 1058, "loss": 1.0883322954177856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.092754" }, { "step": 1059, "loss": 1.1264195442199707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.188626" }, { "step": 1060, "loss": 0.7757364511489868, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.284869" }, { "step": 1061, "loss": 0.9495508074760437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.390336" }, { "step": 1062, "loss": 0.49181225895881653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.477417" }, { "step": 1063, "loss": 0.8831068277359009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.572451" }, { "step": 1064, "loss": 0.4590335786342621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.659936" }, { "step": 1065, "loss": 0.8069454431533813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.765943" }, { "step": 1066, "loss": 0.9429265260696411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.887863" }, { "step": 1067, "loss": 0.7611669301986694, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:28.973086" }, { "step": 1068, "loss": 1.108799695968628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.090645" }, { "step": 1069, "loss": 0.7686221599578857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.188450" }, { "step": 1070, "loss": 0.6078580021858215, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.281518" }, { "step": 1071, "loss": 0.5938620567321777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.378215" }, { "step": 1072, "loss": 0.8484303951263428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.470331" }, { "step": 1073, "loss": 0.8215440511703491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.595094" }, { "step": 1074, "loss": 0.9304682612419128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.683004" }, { "step": 1075, "loss": 0.9215312004089355, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.770359" }, { "step": 1076, "loss": 0.7803306579589844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.869347" }, { "step": 1077, "loss": 0.7618107795715332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:29.964113" }, { "step": 1078, "loss": 1.076745867729187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.077152" }, { "step": 1079, "loss": 0.9359937906265259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.161954" }, { "step": 1080, "loss": 0.6364263296127319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.250986" }, { "step": 1081, "loss": 0.8905977010726929, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.344615" }, { "step": 1082, "loss": 0.6216539144515991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.431498" }, { "step": 1083, "loss": 0.7572320699691772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.523083" }, { "step": 1084, "loss": 0.507041335105896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.615766" }, { "step": 1085, "loss": 1.0913338661193848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.708533" }, { "step": 1086, "loss": 0.6532357335090637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.800477" }, { "step": 1087, "loss": 1.3010938167572021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.888741" }, { "step": 1088, "loss": 0.7272790670394897, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:30.990535" }, { "step": 1089, "loss": 0.8479068279266357, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.082737" }, { "step": 1090, "loss": 0.9586663246154785, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.174295" }, { "step": 1091, "loss": 0.8489705324172974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.259389" }, { "step": 1092, "loss": 0.7998107075691223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.345449" }, { "step": 1093, "loss": 0.9847201108932495, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.431942" }, { "step": 1094, "loss": 0.693953275680542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.522922" }, { "step": 1095, "loss": 1.2045584917068481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.631743" }, { "step": 1096, "loss": 0.7299104928970337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.723460" }, { "step": 1097, "loss": 0.6230279803276062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.814440" }, { "step": 1098, "loss": 0.8806151151657104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:31.932133" }, { "step": 1099, "loss": 0.5007691383361816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.017920" }, { "step": 1100, "loss": 0.7083829641342163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.109518" }, { "step": 1101, "loss": 0.8995263576507568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.213650" }, { "step": 1102, "loss": 1.1776671409606934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.299725" }, { "step": 1103, "loss": 0.9990439414978027, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.418338" }, { "step": 1104, "loss": 1.3340203762054443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.503444" }, { "step": 1105, "loss": 0.8043566942214966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.631726" }, { "step": 1106, "loss": 0.6155959367752075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.727028" }, { "step": 1107, "loss": 0.9049456119537354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.817043" }, { "step": 1108, "loss": 0.7837140560150146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.903733" }, { "step": 1109, "loss": 0.9468764066696167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:32.996792" }, { "step": 1110, "loss": 0.8820022344589233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.085446" }, { "step": 1111, "loss": 0.9183668494224548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.184432" }, { "step": 1112, "loss": 0.6364180445671082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.271540" }, { "step": 1113, "loss": 0.6314646005630493, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.359185" }, { "step": 1114, "loss": 0.7831809520721436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.444165" }, { "step": 1115, "loss": 0.9027881622314453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.529461" }, { "step": 1116, "loss": 0.7925407886505127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.618701" }, { "step": 1117, "loss": 0.8890613317489624, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.744306" }, { "step": 1118, "loss": 1.0543158054351807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.853741" }, { "step": 1119, "loss": 0.8576157093048096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:33.967222" }, { "step": 1120, "loss": 0.8729807138442993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.078519" }, { "step": 1121, "loss": 1.0885539054870605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.190900" }, { "step": 1122, "loss": 0.9534258246421814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.301550" }, { "step": 1123, "loss": 0.9666721820831299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.389547" }, { "step": 1124, "loss": 0.9688005447387695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.473910" }, { "step": 1125, "loss": 0.6201977133750916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.561391" }, { "step": 1126, "loss": 0.9023157358169556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.652986" }, { "step": 1127, "loss": 0.642458438873291, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.755427" }, { "step": 1128, "loss": 0.6112734079360962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.852208" }, { "step": 1129, "loss": 0.6576547026634216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:34.946960" }, { "step": 1130, "loss": 0.5337916016578674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.036854" }, { "step": 1131, "loss": 0.8383836150169373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.164467" }, { "step": 1132, "loss": 0.9260396957397461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.251530" }, { "step": 1133, "loss": 0.7280505895614624, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.343220" }, { "step": 1134, "loss": 0.7967426776885986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.428434" }, { "step": 1135, "loss": 0.8919845819473267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.511342" }, { "step": 1136, "loss": 1.0676597356796265, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.627315" }, { "step": 1137, "loss": 0.8370925784111023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.738774" }, { "step": 1138, "loss": 0.4879205822944641, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.827843" }, { "step": 1139, "loss": 0.8432517051696777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:35.944344" }, { "step": 1140, "loss": 0.8302839398384094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.032344" }, { "step": 1141, "loss": 1.0536046028137207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.151913" }, { "step": 1142, "loss": 0.6908317804336548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.262738" }, { "step": 1143, "loss": 0.7739158868789673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.361535" }, { "step": 1144, "loss": 0.9032776355743408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.473786" }, { "step": 1145, "loss": 0.7701367735862732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.574323" }, { "step": 1146, "loss": 0.5805445313453674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.674134" }, { "step": 1147, "loss": 0.6107333302497864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.771134" }, { "step": 1148, "loss": 0.723787248134613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.863951" }, { "step": 1149, "loss": 0.6818572878837585, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:36.952868" }, { "step": 1150, "loss": 0.6889349222183228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.069695" }, { "step": 1151, "loss": 0.6339285373687744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.156894" }, { "step": 1152, "loss": 1.0264406204223633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.241491" }, { "step": 1153, "loss": 0.5685117244720459, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.326422" }, { "step": 1154, "loss": 0.7812444567680359, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.425452" }, { "step": 1155, "loss": 0.9520845413208008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.515646" }, { "step": 1156, "loss": 0.9520198106765747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.636130" }, { "step": 1157, "loss": 1.0216708183288574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.745530" }, { "step": 1158, "loss": 0.9716659784317017, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.843293" }, { "step": 1159, "loss": 1.097899317741394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:37.931413" }, { "step": 1160, "loss": 0.9400588274002075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.015752" }, { "step": 1161, "loss": 0.6505304574966431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.100687" }, { "step": 1162, "loss": 0.7416532635688782, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.195402" }, { "step": 1163, "loss": 0.6241315603256226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.288424" }, { "step": 1164, "loss": 1.190395474433899, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.384492" }, { "step": 1165, "loss": 0.6430078744888306, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.469846" }, { "step": 1166, "loss": 0.5865511894226074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.567782" }, { "step": 1167, "loss": 0.49096375703811646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.660559" }, { "step": 1168, "loss": 0.832275927066803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.750360" }, { "step": 1169, "loss": 1.0066118240356445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.884039" }, { "step": 1170, "loss": 0.7273716330528259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:38.979784" }, { "step": 1171, "loss": 1.0914371013641357, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.124207" }, { "step": 1172, "loss": 0.7871395349502563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.210098" }, { "step": 1173, "loss": 0.9345299005508423, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.302209" }, { "step": 1174, "loss": 0.9935762882232666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.387149" }, { "step": 1175, "loss": 0.5315535664558411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.480062" }, { "step": 1176, "loss": 0.6519883275032043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.568818" }, { "step": 1177, "loss": 0.8018367886543274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.680786" }, { "step": 1178, "loss": 0.5586428642272949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.775612" }, { "step": 1179, "loss": 0.8014699816703796, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.882622" }, { "step": 1180, "loss": 0.6596553921699524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:39.973774" }, { "step": 1181, "loss": 0.9835232496261597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.076319" }, { "step": 1182, "loss": 0.8291329145431519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.162439" }, { "step": 1183, "loss": 0.7918035984039307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.248923" }, { "step": 1184, "loss": 1.1352126598358154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.362898" }, { "step": 1185, "loss": 0.6893708109855652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.453004" }, { "step": 1186, "loss": 1.2181825637817383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.565089" }, { "step": 1187, "loss": 0.7276662588119507, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.650296" }, { "step": 1188, "loss": 0.9785679578781128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.739741" }, { "step": 1189, "loss": 1.2663332223892212, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.829286" }, { "step": 1190, "loss": 1.0501091480255127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:40.949117" }, { "step": 1191, "loss": 0.7406513690948486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.042302" }, { "step": 1192, "loss": 0.9604898691177368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.129367" }, { "step": 1193, "loss": 0.8063204288482666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.220063" }, { "step": 1194, "loss": 0.9113061428070068, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.305177" }, { "step": 1195, "loss": 0.8765519261360168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.398939" }, { "step": 1196, "loss": 0.6850883960723877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.487095" }, { "step": 1197, "loss": 0.8439918756484985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.574671" }, { "step": 1198, "loss": 0.7656416296958923, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.661433" }, { "step": 1199, "loss": 0.7682062387466431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.755030" }, { "step": 1200, "loss": 0.9906343221664429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.849591" }, { "step": 1201, "loss": 0.6151300668716431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:41.946455" }, { "step": 1202, "loss": 1.0350068807601929, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.031227" }, { "step": 1203, "loss": 0.8787580728530884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.119193" }, { "step": 1204, "loss": 0.9935388565063477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.206164" }, { "step": 1205, "loss": 1.0060324668884277, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.351090" }, { "step": 1206, "loss": 0.9971094131469727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.439132" }, { "step": 1207, "loss": 0.63760906457901, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.536969" }, { "step": 1208, "loss": 0.7422930002212524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.660972" }, { "step": 1209, "loss": 0.8362013697624207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.752978" }, { "step": 1210, "loss": 0.8192808628082275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.841179" }, { "step": 1211, "loss": 0.8310290575027466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:42.934596" }, { "step": 1212, "loss": 0.8264589905738831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.020540" }, { "step": 1213, "loss": 0.9577540159225464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.105344" }, { "step": 1214, "loss": 0.47627493739128113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.195222" }, { "step": 1215, "loss": 0.8174174427986145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.282713" }, { "step": 1216, "loss": 0.9665852785110474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.395289" }, { "step": 1217, "loss": 0.8574032783508301, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.480505" }, { "step": 1218, "loss": 0.8094152808189392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.565957" }, { "step": 1219, "loss": 0.8390383720397949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.692539" }, { "step": 1220, "loss": 0.8677798509597778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.780814" }, { "step": 1221, "loss": 0.9206032156944275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.874587" }, { "step": 1222, "loss": 1.1388778686523438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:43.988832" }, { "step": 1223, "loss": 0.7161514759063721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.082222" }, { "step": 1224, "loss": 1.025384545326233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.203637" }, { "step": 1225, "loss": 1.3830586671829224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.295142" }, { "step": 1226, "loss": 0.9831871390342712, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.415095" }, { "step": 1227, "loss": 0.6753019094467163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.502854" }, { "step": 1228, "loss": 0.7302607297897339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.588932" }, { "step": 1229, "loss": 1.2038938999176025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.677207" }, { "step": 1230, "loss": 0.9647438526153564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.789217" }, { "step": 1231, "loss": 0.5741113424301147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.890447" }, { "step": 1232, "loss": 0.9706248044967651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:44.983026" }, { "step": 1233, "loss": 0.6777171492576599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.068663" }, { "step": 1234, "loss": 0.8894506692886353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.154936" }, { "step": 1235, "loss": 0.8353870511054993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.246307" }, { "step": 1236, "loss": 0.890958309173584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.343088" }, { "step": 1237, "loss": 0.8875815868377686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.429529" }, { "step": 1238, "loss": 0.8156763911247253, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.515848" }, { "step": 1239, "loss": 0.8412986397743225, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.631873" }, { "step": 1240, "loss": 1.112828254699707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.743115" }, { "step": 1241, "loss": 0.5297660827636719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.835111" }, { "step": 1242, "loss": 0.933273434638977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:45.927537" }, { "step": 1243, "loss": 0.8139809370040894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.013669" }, { "step": 1244, "loss": 0.5253555774688721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.100696" }, { "step": 1245, "loss": 0.508169412612915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.188802" }, { "step": 1246, "loss": 0.87684565782547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.282412" }, { "step": 1247, "loss": 1.0651975870132446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.392834" }, { "step": 1248, "loss": 0.6236328482627869, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.483228" }, { "step": 1249, "loss": 0.8252109885215759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.574160" }, { "step": 1250, "loss": 0.6443029046058655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.666453" }, { "step": 1251, "loss": 0.6429926753044128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.753529" }, { "step": 1252, "loss": 0.799961268901825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.841426" }, { "step": 1253, "loss": 0.4927724599838257, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:46.928501" }, { "step": 1254, "loss": 0.7840350866317749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.017930" }, { "step": 1255, "loss": 1.1031200885772705, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.129244" }, { "step": 1256, "loss": 0.5800918340682983, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.221553" }, { "step": 1257, "loss": 0.9207723140716553, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.319731" }, { "step": 1258, "loss": 0.8208332657814026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.417868" }, { "step": 1259, "loss": 0.7033005952835083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.506700" }, { "step": 1260, "loss": 0.7719800472259521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.592405" }, { "step": 1261, "loss": 1.0021041631698608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.704369" }, { "step": 1262, "loss": 1.0678797960281372, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.813196" }, { "step": 1263, "loss": 0.7705833315849304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:47.903355" }, { "step": 1264, "loss": 1.1046000719070435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.022500" }, { "step": 1265, "loss": 0.8490549325942993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.137925" }, { "step": 1266, "loss": 0.6284466981887817, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.244589" }, { "step": 1267, "loss": 0.5978412628173828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.329860" }, { "step": 1268, "loss": 0.43704697489738464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.423409" }, { "step": 1269, "loss": 0.41917914152145386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.520276" }, { "step": 1270, "loss": 0.8155714273452759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.612976" }, { "step": 1271, "loss": 0.5244447588920593, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.699956" }, { "step": 1272, "loss": 0.7310545444488525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.796680" }, { "step": 1273, "loss": 0.7948310375213623, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.893341" }, { "step": 1274, "loss": 0.7688277959823608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:48.990982" }, { "step": 1275, "loss": 1.0013947486877441, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.076188" }, { "step": 1276, "loss": 0.6355981230735779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.162038" }, { "step": 1277, "loss": 0.4715246260166168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.254658" }, { "step": 1278, "loss": 0.7746362686157227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.374733" }, { "step": 1279, "loss": 0.925260066986084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.466565" }, { "step": 1280, "loss": 0.5621695518493652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.566046" }, { "step": 1281, "loss": 0.7770888805389404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.655396" }, { "step": 1282, "loss": 0.9253700971603394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.767332" }, { "step": 1283, "loss": 0.9130239486694336, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.885297" }, { "step": 1284, "loss": 1.1459752321243286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:49.973032" }, { "step": 1285, "loss": 1.0052580833435059, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.084161" }, { "step": 1286, "loss": 0.5300435423851013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.170288" }, { "step": 1287, "loss": 0.769504725933075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.261448" }, { "step": 1288, "loss": 1.1010093688964844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.396489" }, { "step": 1289, "loss": 1.0375827550888062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.506466" }, { "step": 1290, "loss": 1.0388914346694946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.603105" }, { "step": 1291, "loss": 0.807604968547821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.687412" }, { "step": 1292, "loss": 0.6778517961502075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.773145" }, { "step": 1293, "loss": 0.9805058240890503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.858461" }, { "step": 1294, "loss": 0.8442914485931396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:50.985116" }, { "step": 1295, "loss": 0.828373908996582, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.103056" }, { "step": 1296, "loss": 0.7580903768539429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.201622" }, { "step": 1297, "loss": 0.7542917728424072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.287713" }, { "step": 1298, "loss": 0.931371808052063, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.374383" }, { "step": 1299, "loss": 0.871410071849823, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.469465" }, { "step": 1300, "loss": 1.1011686325073242, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.582033" }, { "step": 1301, "loss": 0.6524278521537781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.669207" }, { "step": 1302, "loss": 1.0507649183273315, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.762488" }, { "step": 1303, "loss": 0.5671510696411133, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.861481" }, { "step": 1304, "loss": 0.8257695436477661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:51.955359" }, { "step": 1305, "loss": 0.7524343729019165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.041981" }, { "step": 1306, "loss": 0.9303247928619385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.127926" }, { "step": 1307, "loss": 0.6468095779418945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.225029" }, { "step": 1308, "loss": 0.7810192108154297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.318897" }, { "step": 1309, "loss": 1.3610275983810425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.404567" }, { "step": 1310, "loss": 0.6951385736465454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.490147" }, { "step": 1311, "loss": 0.4279547929763794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.582887" }, { "step": 1312, "loss": 0.9291030168533325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.726784" }, { "step": 1313, "loss": 0.602829098701477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.811800" }, { "step": 1314, "loss": 0.8244240283966064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.909042" }, { "step": 1315, "loss": 0.8630656003952026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:52.994400" }, { "step": 1316, "loss": 0.6474165320396423, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.086254" }, { "step": 1317, "loss": 0.6155105233192444, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.172097" }, { "step": 1318, "loss": 0.7142314910888672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.266019" }, { "step": 1319, "loss": 0.825477659702301, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.358720" }, { "step": 1320, "loss": 1.0064691305160522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.453315" }, { "step": 1321, "loss": 1.2159010171890259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.565006" }, { "step": 1322, "loss": 0.5168448686599731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.651086" }, { "step": 1323, "loss": 0.9717031717300415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.772055" }, { "step": 1324, "loss": 0.5742778182029724, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.859424" }, { "step": 1325, "loss": 1.0147373676300049, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:53.974124" }, { "step": 1326, "loss": 0.6376160383224487, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.067565" }, { "step": 1327, "loss": 0.8630448579788208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.176977" }, { "step": 1328, "loss": 0.8772441148757935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.267921" }, { "step": 1329, "loss": 0.8352408409118652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.355495" }, { "step": 1330, "loss": 0.8143050670623779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.442320" }, { "step": 1331, "loss": 0.9719842672348022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.536574" }, { "step": 1332, "loss": 0.8288818597793579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.625530" }, { "step": 1333, "loss": 0.8148444294929504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.711719" }, { "step": 1334, "loss": 0.6223951578140259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.799224" }, { "step": 1335, "loss": 1.06356942653656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.885351" }, { "step": 1336, "loss": 0.5120475888252258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:54.974964" }, { "step": 1337, "loss": 1.114715576171875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.067192" }, { "step": 1338, "loss": 0.6562968492507935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.152254" }, { "step": 1339, "loss": 0.6546900272369385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.248444" }, { "step": 1340, "loss": 0.7300695180892944, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.332800" }, { "step": 1341, "loss": 1.0420578718185425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.469994" }, { "step": 1342, "loss": 0.561761736869812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.558205" }, { "step": 1343, "loss": 0.6883903741836548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.649401" }, { "step": 1344, "loss": 0.8165489435195923, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.743601" }, { "step": 1345, "loss": 0.9179015159606934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.871768" }, { "step": 1346, "loss": 0.8713082075119019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:55.983419" }, { "step": 1347, "loss": 0.6662948131561279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.075528" }, { "step": 1348, "loss": 0.7121116518974304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.187324" }, { "step": 1349, "loss": 1.119958519935608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.272021" }, { "step": 1350, "loss": 0.8439207077026367, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.363759" }, { "step": 1351, "loss": 0.6983997821807861, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.458278" }, { "step": 1352, "loss": 0.7621984481811523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.574440" }, { "step": 1353, "loss": 0.5928847789764404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.659585" }, { "step": 1354, "loss": 0.7258509397506714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.748436" }, { "step": 1355, "loss": 0.8832218050956726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.855918" }, { "step": 1356, "loss": 0.6429375410079956, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:56.943915" }, { "step": 1357, "loss": 1.0396933555603027, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.029982" }, { "step": 1358, "loss": 0.45435094833374023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.112484" }, { "step": 1359, "loss": 0.7748469114303589, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.209909" }, { "step": 1360, "loss": 0.7862928509712219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.295612" }, { "step": 1361, "loss": 0.9532199501991272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.381513" }, { "step": 1362, "loss": 0.8156052827835083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.467602" }, { "step": 1363, "loss": 0.7562074661254883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.552440" }, { "step": 1364, "loss": 1.0879300832748413, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.644238" }, { "step": 1365, "loss": 0.8034428358078003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.730449" }, { "step": 1366, "loss": 0.879498302936554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.841924" }, { "step": 1367, "loss": 0.542577862739563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:57.940953" }, { "step": 1368, "loss": 0.787277340888977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.026979" }, { "step": 1369, "loss": 0.7463059425354004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.112174" }, { "step": 1370, "loss": 1.030380368232727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.221360" }, { "step": 1371, "loss": 0.5877465605735779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.310278" }, { "step": 1372, "loss": 1.0518743991851807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.435843" }, { "step": 1373, "loss": 0.8090893030166626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.525309" }, { "step": 1374, "loss": 0.9528887271881104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.634342" }, { "step": 1375, "loss": 0.7483019232749939, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.721337" }, { "step": 1376, "loss": 0.795137882232666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.820554" }, { "step": 1377, "loss": 1.0504493713378906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:58.930023" }, { "step": 1378, "loss": 0.9793991446495056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.016326" }, { "step": 1379, "loss": 0.691773533821106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.101282" }, { "step": 1380, "loss": 0.5745719075202942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.192366" }, { "step": 1381, "loss": 1.0375467538833618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.315571" }, { "step": 1382, "loss": 0.6146559715270996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.402589" }, { "step": 1383, "loss": 1.1213276386260986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.513078" }, { "step": 1384, "loss": 0.9412680864334106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.601553" }, { "step": 1385, "loss": 1.066373586654663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.686731" }, { "step": 1386, "loss": 0.6491132378578186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.782291" }, { "step": 1387, "loss": 1.1085803508758545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.869660" }, { "step": 1388, "loss": 0.5148281455039978, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:25:59.961884" }, { "step": 1389, "loss": 0.9369708299636841, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.049696" }, { "step": 1390, "loss": 0.8686786890029907, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.138471" }, { "step": 1391, "loss": 0.8135048747062683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.256233" }, { "step": 1392, "loss": 0.7361763715744019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.381038" }, { "step": 1393, "loss": 0.6618208289146423, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.481163" }, { "step": 1394, "loss": 0.7202247381210327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.573460" }, { "step": 1395, "loss": 0.5800598859786987, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.660118" }, { "step": 1396, "loss": 0.764702558517456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.744242" }, { "step": 1397, "loss": 0.7018097639083862, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.834524" }, { "step": 1398, "loss": 0.7570836544036865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:00.924515" }, { "step": 1399, "loss": 1.0392673015594482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.017507" }, { "step": 1400, "loss": 0.6255046725273132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.107513" }, { "step": 1401, "loss": 0.9571327567100525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.195711" }, { "step": 1402, "loss": 0.8776367902755737, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.280373" }, { "step": 1403, "loss": 0.6336356401443481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.366483" }, { "step": 1404, "loss": 0.7361331582069397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.461149" }, { "step": 1405, "loss": 1.1256130933761597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.548464" }, { "step": 1406, "loss": 0.8668941259384155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.644414" }, { "step": 1407, "loss": 0.785995364189148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.740001" }, { "step": 1408, "loss": 0.7960246801376343, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.825309" }, { "step": 1409, "loss": 1.1484529972076416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:01.915742" }, { "step": 1410, "loss": 0.6971302032470703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.007282" }, { "step": 1411, "loss": 0.6052474975585938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.098087" }, { "step": 1412, "loss": 0.5584670305252075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.197245" }, { "step": 1413, "loss": 0.6227949261665344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.282215" }, { "step": 1414, "loss": 1.2273463010787964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.369976" }, { "step": 1415, "loss": 0.5107699632644653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.455180" }, { "step": 1416, "loss": 0.9211674332618713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.541335" }, { "step": 1417, "loss": 0.7596094012260437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.636978" }, { "step": 1418, "loss": 0.6879094839096069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.722075" }, { "step": 1419, "loss": 0.7283205986022949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.808361" }, { "step": 1420, "loss": 0.5282256007194519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.900457" }, { "step": 1421, "loss": 0.7715545892715454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:02.986588" }, { "step": 1422, "loss": 0.6911719441413879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.076064" }, { "step": 1423, "loss": 0.6024216413497925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.170142" }, { "step": 1424, "loss": 1.1700400114059448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.282146" }, { "step": 1425, "loss": 0.9393367767333984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.370530" }, { "step": 1426, "loss": 0.7373405694961548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.464937" }, { "step": 1427, "loss": 0.9315598011016846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.588332" }, { "step": 1428, "loss": 0.5354658365249634, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.687202" }, { "step": 1429, "loss": 0.9601385593414307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.809697" }, { "step": 1430, "loss": 1.2421863079071045, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:03.923780" }, { "step": 1431, "loss": 1.144200086593628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.037391" }, { "step": 1432, "loss": 0.7681925892829895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.136841" }, { "step": 1433, "loss": 0.6077857613563538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.222318" }, { "step": 1434, "loss": 0.9566330909729004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.316656" }, { "step": 1435, "loss": 0.5346153974533081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.429949" }, { "step": 1436, "loss": 1.0377737283706665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.521456" }, { "step": 1437, "loss": 0.9465749263763428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.618662" }, { "step": 1438, "loss": 1.079223394393921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.716594" }, { "step": 1439, "loss": 0.8021069765090942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.813556" }, { "step": 1440, "loss": 0.684778094291687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.897435" }, { "step": 1441, "loss": 1.0960487127304077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:04.990359" }, { "step": 1442, "loss": 0.7083713412284851, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.084654" }, { "step": 1443, "loss": 0.6576230525970459, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.170782" }, { "step": 1444, "loss": 0.9445117712020874, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.257116" }, { "step": 1445, "loss": 0.6391264200210571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.354696" }, { "step": 1446, "loss": 0.6814266443252563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.437709" }, { "step": 1447, "loss": 0.8106536865234375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.530404" }, { "step": 1448, "loss": 0.9683991074562073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.618096" }, { "step": 1449, "loss": 0.958247184753418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.735208" }, { "step": 1450, "loss": 0.8211939334869385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.856837" }, { "step": 1451, "loss": 0.5987973213195801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:05.943714" }, { "step": 1452, "loss": 1.0494804382324219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.052033" }, { "step": 1453, "loss": 0.8410564661026001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.168666" }, { "step": 1454, "loss": 0.6569469571113586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.256271" }, { "step": 1455, "loss": 0.7755404710769653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.367629" }, { "step": 1456, "loss": 0.8595168590545654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.458886" }, { "step": 1457, "loss": 0.7490878105163574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.545320" }, { "step": 1458, "loss": 0.6204314231872559, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.655499" }, { "step": 1459, "loss": 0.5994475483894348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.741237" }, { "step": 1460, "loss": 0.6752996444702148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.833965" }, { "step": 1461, "loss": 0.8837582468986511, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:06.932441" }, { "step": 1462, "loss": 0.435092568397522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.017232" }, { "step": 1463, "loss": 0.7778792977333069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.104821" }, { "step": 1464, "loss": 0.7172398567199707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.197594" }, { "step": 1465, "loss": 1.040575623512268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.308939" }, { "step": 1466, "loss": 0.5442305207252502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.408725" }, { "step": 1467, "loss": 1.1512658596038818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.494869" }, { "step": 1468, "loss": 0.5602343082427979, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.587859" }, { "step": 1469, "loss": 0.8491759300231934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.679773" }, { "step": 1470, "loss": 0.9644253253936768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.781231" }, { "step": 1471, "loss": 0.861324667930603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.883120" }, { "step": 1472, "loss": 0.6841694712638855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:07.971257" }, { "step": 1473, "loss": 0.8362206816673279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.072702" }, { "step": 1474, "loss": 0.5605000257492065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.164668" }, { "step": 1475, "loss": 0.8246414661407471, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.285819" }, { "step": 1476, "loss": 0.7721787691116333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.403176" }, { "step": 1477, "loss": 0.4686989486217499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.495833" }, { "step": 1478, "loss": 0.7064263820648193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.588620" }, { "step": 1479, "loss": 0.8174221515655518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.674064" }, { "step": 1480, "loss": 0.9496350884437561, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.770428" }, { "step": 1481, "loss": 0.7544870972633362, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.862432" }, { "step": 1482, "loss": 0.6121529936790466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:08.954380" }, { "step": 1483, "loss": 0.6790629625320435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.072076" }, { "step": 1484, "loss": 1.0299186706542969, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.186669" }, { "step": 1485, "loss": 0.5644404292106628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.277248" }, { "step": 1486, "loss": 0.8615404367446899, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.371092" }, { "step": 1487, "loss": 0.8207064867019653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.456147" }, { "step": 1488, "loss": 0.5968309640884399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.546330" }, { "step": 1489, "loss": 0.8281489014625549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.674981" }, { "step": 1490, "loss": 1.1054582595825195, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.789982" }, { "step": 1491, "loss": 0.5893365144729614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.874319" }, { "step": 1492, "loss": 0.6241584420204163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:09.963477" }, { "step": 1493, "loss": 0.7177639603614807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.084308" }, { "step": 1494, "loss": 0.8536834120750427, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.193257" }, { "step": 1495, "loss": 0.41816043853759766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.280793" }, { "step": 1496, "loss": 0.8183603286743164, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.376927" }, { "step": 1497, "loss": 0.6891762614250183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.465791" }, { "step": 1498, "loss": 0.5402716398239136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.558989" }, { "step": 1499, "loss": 0.8204569816589355, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.647482" }, { "step": 1500, "loss": 0.7325376272201538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:10.740558" }, { "step": 1501, "loss": 0.7187865972518921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:33.500629" }, { "step": 1502, "loss": 0.7106460332870483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:33.594822" }, { "step": 1503, "loss": 0.8585537672042847, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:33.717598" }, { "step": 1504, "loss": 0.6166272163391113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:33.809169" }, { "step": 1505, "loss": 0.7486084699630737, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:33.900261" }, { "step": 1506, "loss": 0.7847186326980591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.016092" }, { "step": 1507, "loss": 1.027967929840088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.104213" }, { "step": 1508, "loss": 0.5093907117843628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.204141" }, { "step": 1509, "loss": 0.7118560075759888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.288376" }, { "step": 1510, "loss": 0.6414411664009094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.384153" }, { "step": 1511, "loss": 0.6267388463020325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.470823" }, { "step": 1512, "loss": 0.32387349009513855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.563122" }, { "step": 1513, "loss": 0.8280535936355591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.657386" }, { "step": 1514, "loss": 1.0401893854141235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.742505" }, { "step": 1515, "loss": 0.5590939521789551, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.828076" }, { "step": 1516, "loss": 0.7083680033683777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:34.957180" }, { "step": 1517, "loss": 0.8127727508544922, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.048506" }, { "step": 1518, "loss": 0.5258845686912537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.142760" }, { "step": 1519, "loss": 0.8796089887619019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.237347" }, { "step": 1520, "loss": 1.000694990158081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.324150" }, { "step": 1521, "loss": 0.6381533145904541, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.420764" }, { "step": 1522, "loss": 0.9343708753585815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.529197" }, { "step": 1523, "loss": 0.4290573000907898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.619649" }, { "step": 1524, "loss": 0.9562275409698486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.733394" }, { "step": 1525, "loss": 0.8772760033607483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.836747" }, { "step": 1526, "loss": 0.8839503526687622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:35.922127" }, { "step": 1527, "loss": 0.9411407709121704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.040021" }, { "step": 1528, "loss": 0.8386807441711426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.133154" }, { "step": 1529, "loss": 0.914747953414917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.219976" }, { "step": 1530, "loss": 1.0330967903137207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.331938" }, { "step": 1531, "loss": 0.7893034815788269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.423641" }, { "step": 1532, "loss": 0.5597468018531799, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.515859" }, { "step": 1533, "loss": 0.9258995056152344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.629171" }, { "step": 1534, "loss": 0.7751642465591431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.725476" }, { "step": 1535, "loss": 0.7131752371788025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.809931" }, { "step": 1536, "loss": 0.5177452564239502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:36.902556" }, { "step": 1537, "loss": 1.0851553678512573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.002641" }, { "step": 1538, "loss": 0.8221091032028198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.106011" }, { "step": 1539, "loss": 0.8442791104316711, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.192470" }, { "step": 1540, "loss": 0.9485673904418945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.284096" }, { "step": 1541, "loss": 1.0784008502960205, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.402830" }, { "step": 1542, "loss": 0.48873472213745117, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.491993" }, { "step": 1543, "loss": 0.692301332950592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.592137" }, { "step": 1544, "loss": 0.5088498592376709, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.683878" }, { "step": 1545, "loss": 0.736901044845581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.775520" }, { "step": 1546, "loss": 0.5156732797622681, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.861257" }, { "step": 1547, "loss": 0.6814768314361572, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:37.958708" }, { "step": 1548, "loss": 1.4189262390136719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.045331" }, { "step": 1549, "loss": 0.49195054173469543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.138394" }, { "step": 1550, "loss": 0.558677077293396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.230036" }, { "step": 1551, "loss": 0.7532663345336914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.323188" }, { "step": 1552, "loss": 0.7877296209335327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.414301" }, { "step": 1553, "loss": 0.5422468185424805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.512802" }, { "step": 1554, "loss": 1.0028620958328247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.601169" }, { "step": 1555, "loss": 0.8924840688705444, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.701257" }, { "step": 1556, "loss": 0.9331680536270142, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.798685" }, { "step": 1557, "loss": 0.809785008430481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:38.886791" }, { "step": 1558, "loss": 1.0668014287948608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.029293" }, { "step": 1559, "loss": 0.9430599808692932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.117665" }, { "step": 1560, "loss": 0.7307447791099548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.236916" }, { "step": 1561, "loss": 0.9169729948043823, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.323876" }, { "step": 1562, "loss": 0.9039109945297241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.437935" }, { "step": 1563, "loss": 0.7082564830780029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.534412" }, { "step": 1564, "loss": 0.9417604207992554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.627845" }, { "step": 1565, "loss": 0.9965002536773682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.714590" }, { "step": 1566, "loss": 0.9232640266418457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.822280" }, { "step": 1567, "loss": 0.8627521395683289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:39.918866" }, { "step": 1568, "loss": 0.9412593841552734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.007812" }, { "step": 1569, "loss": 0.7808510065078735, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.092139" }, { "step": 1570, "loss": 0.6839473843574524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.184640" }, { "step": 1571, "loss": 0.8769899606704712, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.301983" }, { "step": 1572, "loss": 0.4146837890148163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.390703" }, { "step": 1573, "loss": 0.8606040477752686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.476874" }, { "step": 1574, "loss": 1.10761559009552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.613761" }, { "step": 1575, "loss": 0.88626629114151, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.702704" }, { "step": 1576, "loss": 0.573982834815979, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.794340" }, { "step": 1577, "loss": 0.7323048710823059, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.878319" }, { "step": 1578, "loss": 0.7683476209640503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:40.987168" }, { "step": 1579, "loss": 0.7403141260147095, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.105766" }, { "step": 1580, "loss": 0.7244820594787598, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.203606" }, { "step": 1581, "loss": 1.215350866317749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.298666" }, { "step": 1582, "loss": 0.9002470970153809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.386670" }, { "step": 1583, "loss": 0.6834888458251953, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.481631" }, { "step": 1584, "loss": 0.9782949686050415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.568616" }, { "step": 1585, "loss": 0.6823564767837524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.684086" }, { "step": 1586, "loss": 0.8979634046554565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.770972" }, { "step": 1587, "loss": 0.7908042669296265, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.883187" }, { "step": 1588, "loss": 0.8356561660766602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:41.976115" }, { "step": 1589, "loss": 0.6399887204170227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.078692" }, { "step": 1590, "loss": 0.7164868712425232, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.165716" }, { "step": 1591, "loss": 0.5829732418060303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.251092" }, { "step": 1592, "loss": 0.6405943632125854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.352125" }, { "step": 1593, "loss": 1.1882487535476685, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.447381" }, { "step": 1594, "loss": 0.6328670382499695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.529959" }, { "step": 1595, "loss": 0.8694331645965576, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.623782" }, { "step": 1596, "loss": 0.5960484147071838, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.719164" }, { "step": 1597, "loss": 0.6961273550987244, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.811460" }, { "step": 1598, "loss": 0.8560866117477417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.905192" }, { "step": 1599, "loss": 0.8304780721664429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:42.999560" }, { "step": 1600, "loss": 1.0559648275375366, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.085595" }, { "step": 1601, "loss": 0.6326951384544373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.180168" }, { "step": 1602, "loss": 1.1583244800567627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.266801" }, { "step": 1603, "loss": 0.686031699180603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.364094" }, { "step": 1604, "loss": 0.7291079759597778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.449039" }, { "step": 1605, "loss": 0.628980278968811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.561037" }, { "step": 1606, "loss": 0.9625290632247925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.645595" }, { "step": 1607, "loss": 0.6895248889923096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.735712" }, { "step": 1608, "loss": 0.8885202407836914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.848413" }, { "step": 1609, "loss": 0.654343843460083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:43.940989" }, { "step": 1610, "loss": 0.5195720195770264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.043169" }, { "step": 1611, "loss": 0.8236004114151001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.128432" }, { "step": 1612, "loss": 0.8457984328269958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.213014" }, { "step": 1613, "loss": 0.6437051296234131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.298545" }, { "step": 1614, "loss": 0.4065866470336914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.394497" }, { "step": 1615, "loss": 0.7834150791168213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.482573" }, { "step": 1616, "loss": 0.6846850514411926, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.570368" }, { "step": 1617, "loss": 0.6752805113792419, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.699292" }, { "step": 1618, "loss": 0.7441267371177673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.817487" }, { "step": 1619, "loss": 0.9107120037078857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:44.957243" }, { "step": 1620, "loss": 0.848953127861023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.048937" }, { "step": 1621, "loss": 0.7264012098312378, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.135699" }, { "step": 1622, "loss": 0.8134735226631165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.231103" }, { "step": 1623, "loss": 0.9396449327468872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.355417" }, { "step": 1624, "loss": 0.5515403747558594, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.448322" }, { "step": 1625, "loss": 0.42573073506355286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.542185" }, { "step": 1626, "loss": 0.5851984620094299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.627138" }, { "step": 1627, "loss": 0.7242912650108337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.730682" }, { "step": 1628, "loss": 0.9053226709365845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.838908" }, { "step": 1629, "loss": 0.778213620185852, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:45.931182" }, { "step": 1630, "loss": 1.1150093078613281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.013594" }, { "step": 1631, "loss": 0.6811994314193726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.106186" }, { "step": 1632, "loss": 0.7425647974014282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.192054" }, { "step": 1633, "loss": 1.042852759361267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.287206" }, { "step": 1634, "loss": 0.622652530670166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.374322" }, { "step": 1635, "loss": 0.903398871421814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.459337" }, { "step": 1636, "loss": 0.4199828803539276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.550663" }, { "step": 1637, "loss": 0.659588634967804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.641541" }, { "step": 1638, "loss": 0.8658040761947632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.727857" }, { "step": 1639, "loss": 1.1394671201705933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.823055" }, { "step": 1640, "loss": 0.8732571005821228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:46.945468" }, { "step": 1641, "loss": 1.2527072429656982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.056726" }, { "step": 1642, "loss": 0.5483340620994568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.156540" }, { "step": 1643, "loss": 0.6040744781494141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.251930" }, { "step": 1644, "loss": 0.6814457178115845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.345387" }, { "step": 1645, "loss": 0.6035465598106384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.432374" }, { "step": 1646, "loss": 0.7392975091934204, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.525410" }, { "step": 1647, "loss": 0.770897388458252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.618463" }, { "step": 1648, "loss": 0.9180290699005127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.709711" }, { "step": 1649, "loss": 0.7463035583496094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.828125" }, { "step": 1650, "loss": 0.7210016846656799, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:47.913550" }, { "step": 1651, "loss": 0.9486218690872192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.000224" }, { "step": 1652, "loss": 0.7463973760604858, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.096207" }, { "step": 1653, "loss": 0.780491292476654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.186652" }, { "step": 1654, "loss": 0.8214916586875916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.274918" }, { "step": 1655, "loss": 0.4835592806339264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.373506" }, { "step": 1656, "loss": 0.9692674875259399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.461398" }, { "step": 1657, "loss": 0.5806229710578918, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.557791" }, { "step": 1658, "loss": 1.1792134046554565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.674776" }, { "step": 1659, "loss": 0.8327691555023193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.795186" }, { "step": 1660, "loss": 0.9207766056060791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:48.906533" }, { "step": 1661, "loss": 1.1395450830459595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.022077" }, { "step": 1662, "loss": 0.710971474647522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.108664" }, { "step": 1663, "loss": 0.6799346208572388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.193480" }, { "step": 1664, "loss": 0.8805389404296875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.310530" }, { "step": 1665, "loss": 1.1726839542388916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.400616" }, { "step": 1666, "loss": 0.48349088430404663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.493385" }, { "step": 1667, "loss": 0.944056510925293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.595126" }, { "step": 1668, "loss": 0.6913616061210632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.716524" }, { "step": 1669, "loss": 0.6528617143630981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.801678" }, { "step": 1670, "loss": 0.8860700130462646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.899091" }, { "step": 1671, "loss": 0.639069676399231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:49.992975" }, { "step": 1672, "loss": 0.8550063371658325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.107937" }, { "step": 1673, "loss": 0.7596286535263062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.194092" }, { "step": 1674, "loss": 0.7663513422012329, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.290998" }, { "step": 1675, "loss": 0.7850126624107361, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.389288" }, { "step": 1676, "loss": 0.8487158417701721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.473734" }, { "step": 1677, "loss": 0.5116404294967651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.564164" }, { "step": 1678, "loss": 0.9032230973243713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.656803" }, { "step": 1679, "loss": 0.5591224431991577, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.748577" }, { "step": 1680, "loss": 0.5866772532463074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.834470" }, { "step": 1681, "loss": 0.4728408455848694, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:50.928139" }, { "step": 1682, "loss": 0.7105615735054016, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.020585" }, { "step": 1683, "loss": 0.4887215197086334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.116110" }, { "step": 1684, "loss": 0.9512892365455627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.208094" }, { "step": 1685, "loss": 0.6274917721748352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.306376" }, { "step": 1686, "loss": 0.9147731065750122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.421297" }, { "step": 1687, "loss": 0.4085814952850342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.507663" }, { "step": 1688, "loss": 0.9438515305519104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.613531" }, { "step": 1689, "loss": 0.9555404186248779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.733084" }, { "step": 1690, "loss": 0.9925236701965332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.819261" }, { "step": 1691, "loss": 0.499704509973526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:51.908427" }, { "step": 1692, "loss": 0.8120027780532837, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.032506" }, { "step": 1693, "loss": 0.6869354844093323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.125710" }, { "step": 1694, "loss": 0.8656712770462036, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.235826" }, { "step": 1695, "loss": 1.0533676147460938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.332834" }, { "step": 1696, "loss": 1.3578035831451416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.424228" }, { "step": 1697, "loss": 0.715682864189148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.520013" }, { "step": 1698, "loss": 0.7085258960723877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.604842" }, { "step": 1699, "loss": 0.6702102422714233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.690709" }, { "step": 1700, "loss": 0.6776799559593201, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.776120" }, { "step": 1701, "loss": 1.0066267251968384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.864483" }, { "step": 1702, "loss": 0.5106871724128723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:52.958851" }, { "step": 1703, "loss": 0.7695677280426025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.078872" }, { "step": 1704, "loss": 1.0554074048995972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.196303" }, { "step": 1705, "loss": 1.1048004627227783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.303864" }, { "step": 1706, "loss": 0.9171622395515442, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.413580" }, { "step": 1707, "loss": 0.9776779413223267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.502960" }, { "step": 1708, "loss": 0.7974017858505249, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.598235" }, { "step": 1709, "loss": 0.5222417116165161, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.690778" }, { "step": 1710, "loss": 1.00734543800354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.785997" }, { "step": 1711, "loss": 0.9647928476333618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:53.896534" }, { "step": 1712, "loss": 1.0354390144348145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.034051" }, { "step": 1713, "loss": 0.8584238290786743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.147589" }, { "step": 1714, "loss": 0.8834152221679688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.259159" }, { "step": 1715, "loss": 1.1813910007476807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.344258" }, { "step": 1716, "loss": 0.530284583568573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.437522" }, { "step": 1717, "loss": 0.8683257102966309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.522143" }, { "step": 1718, "loss": 0.7007846236228943, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.607326" }, { "step": 1719, "loss": 0.557866632938385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.694895" }, { "step": 1720, "loss": 0.98589688539505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.807898" }, { "step": 1721, "loss": 0.6633203029632568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.898442" }, { "step": 1722, "loss": 0.542639970779419, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:54.983891" }, { "step": 1723, "loss": 0.646965503692627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.077313" }, { "step": 1724, "loss": 1.076069951057434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.215720" }, { "step": 1725, "loss": 0.5733832120895386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.305245" }, { "step": 1726, "loss": 0.774743914604187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.414877" }, { "step": 1727, "loss": 0.3979939818382263, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.502113" }, { "step": 1728, "loss": 1.1056227684020996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.615932" }, { "step": 1729, "loss": 0.700261652469635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.704699" }, { "step": 1730, "loss": 0.7036036252975464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.797336" }, { "step": 1731, "loss": 0.7633544206619263, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.882326" }, { "step": 1732, "loss": 0.6831862926483154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:55.967790" }, { "step": 1733, "loss": 0.9476801156997681, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.082564" }, { "step": 1734, "loss": 0.8716806769371033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.180594" }, { "step": 1735, "loss": 0.6110721826553345, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.267017" }, { "step": 1736, "loss": 0.9853053092956543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.352577" }, { "step": 1737, "loss": 0.38925305008888245, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.437340" }, { "step": 1738, "loss": 1.002710223197937, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.568564" }, { "step": 1739, "loss": 0.9119391441345215, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.654087" }, { "step": 1740, "loss": 0.5883725881576538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.753413" }, { "step": 1741, "loss": 0.607384204864502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.843618" }, { "step": 1742, "loss": 0.8617742657661438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:56.936654" }, { "step": 1743, "loss": 0.7097076773643494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.026394" }, { "step": 1744, "loss": 0.49533212184906006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.119540" }, { "step": 1745, "loss": 0.9483170509338379, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.237691" }, { "step": 1746, "loss": 0.8691346049308777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.329955" }, { "step": 1747, "loss": 0.5861386060714722, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.426592" }, { "step": 1748, "loss": 1.1365867853164673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.532328" }, { "step": 1749, "loss": 1.152987003326416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.646925" }, { "step": 1750, "loss": 0.8631788492202759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.732729" }, { "step": 1751, "loss": 1.2884870767593384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.821620" }, { "step": 1752, "loss": 0.7970128655433655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:57.906737" }, { "step": 1753, "loss": 0.505620002746582, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.011448" }, { "step": 1754, "loss": 0.49528926610946655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.107430" }, { "step": 1755, "loss": 0.66327965259552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.199446" }, { "step": 1756, "loss": 0.8817498683929443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.312729" }, { "step": 1757, "loss": 0.8818161487579346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.423613" }, { "step": 1758, "loss": 0.856137216091156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.510515" }, { "step": 1759, "loss": 0.9136111736297607, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.598257" }, { "step": 1760, "loss": 0.9978796243667603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.701725" }, { "step": 1761, "loss": 0.7763382196426392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.788404" }, { "step": 1762, "loss": 0.7573778033256531, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.882630" }, { "step": 1763, "loss": 0.9834239482879639, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:58.995032" }, { "step": 1764, "loss": 0.9716619253158569, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.090426" }, { "step": 1765, "loss": 1.008638620376587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.202312" }, { "step": 1766, "loss": 0.7643083930015564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.294715" }, { "step": 1767, "loss": 0.8467000722885132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.409458" }, { "step": 1768, "loss": 0.7824146151542664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.503607" }, { "step": 1769, "loss": 0.9416370391845703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.615878" }, { "step": 1770, "loss": 0.6026697754859924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.739544" }, { "step": 1771, "loss": 0.6737789511680603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.831900" }, { "step": 1772, "loss": 0.4737197756767273, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:26:59.922188" }, { "step": 1773, "loss": 0.5306640863418579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.012411" }, { "step": 1774, "loss": 0.9374620914459229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.107869" }, { "step": 1775, "loss": 0.8617485165596008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.192384" }, { "step": 1776, "loss": 0.7807355523109436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.278283" }, { "step": 1777, "loss": 0.49240440130233765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.370689" }, { "step": 1778, "loss": 0.5823877453804016, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.467122" }, { "step": 1779, "loss": 0.62892085313797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.552849" }, { "step": 1780, "loss": 0.6780792474746704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.646742" }, { "step": 1781, "loss": 1.119220495223999, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.766247" }, { "step": 1782, "loss": 0.6864781379699707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.853315" }, { "step": 1783, "loss": 0.4659025967121124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:00.945591" }, { "step": 1784, "loss": 0.5828922390937805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.033704" }, { "step": 1785, "loss": 0.823110818862915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.119877" }, { "step": 1786, "loss": 0.7622283697128296, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.204900" }, { "step": 1787, "loss": 0.5225710868835449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.290955" }, { "step": 1788, "loss": 0.7888858914375305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.383183" }, { "step": 1789, "loss": 0.5717642307281494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.472376" }, { "step": 1790, "loss": 0.8344401121139526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.564118" }, { "step": 1791, "loss": 0.937287449836731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.656973" }, { "step": 1792, "loss": 0.5000914931297302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.749545" }, { "step": 1793, "loss": 0.4631006121635437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.840846" }, { "step": 1794, "loss": 0.4942971467971802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:01.935245" }, { "step": 1795, "loss": 1.1497340202331543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.032905" }, { "step": 1796, "loss": 0.47933948040008545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.118660" }, { "step": 1797, "loss": 0.5815085172653198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.209101" }, { "step": 1798, "loss": 0.49563950300216675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.294565" }, { "step": 1799, "loss": 0.8669488430023193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.380399" }, { "step": 1800, "loss": 0.7496854066848755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.469766" }, { "step": 1801, "loss": 0.7192082405090332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.561947" }, { "step": 1802, "loss": 0.8468202352523804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.680835" }, { "step": 1803, "loss": 0.45935508608818054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.773352" }, { "step": 1804, "loss": 0.746845006942749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.886481" }, { "step": 1805, "loss": 1.1259496212005615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:02.999590" }, { "step": 1806, "loss": 0.9907668828964233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.116862" }, { "step": 1807, "loss": 1.0750583410263062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.225554" }, { "step": 1808, "loss": 0.7720011472702026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.342795" }, { "step": 1809, "loss": 0.6590583324432373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.441234" }, { "step": 1810, "loss": 0.77104252576828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.534066" }, { "step": 1811, "loss": 0.7433466911315918, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.630896" }, { "step": 1812, "loss": 0.5872305035591125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.723505" }, { "step": 1813, "loss": 0.6861262321472168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.807688" }, { "step": 1814, "loss": 0.7994439601898193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.902618" }, { "step": 1815, "loss": 0.5702865719795227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:03.997201" }, { "step": 1816, "loss": 0.8381694555282593, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.088218" }, { "step": 1817, "loss": 0.6543471217155457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.207616" }, { "step": 1818, "loss": 1.0083260536193848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.324768" }, { "step": 1819, "loss": 0.8269699811935425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.415649" }, { "step": 1820, "loss": 1.0031217336654663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.506154" }, { "step": 1821, "loss": 0.5848889946937561, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.599955" }, { "step": 1822, "loss": 1.0898303985595703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.700633" }, { "step": 1823, "loss": 0.6521490216255188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.795438" }, { "step": 1824, "loss": 0.5647448897361755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:04.908761" }, { "step": 1825, "loss": 0.8086777329444885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.022525" }, { "step": 1826, "loss": 1.0061997175216675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.121192" }, { "step": 1827, "loss": 0.9253878593444824, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.229394" }, { "step": 1828, "loss": 0.8325805068016052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.372759" }, { "step": 1829, "loss": 0.6689059734344482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.457946" }, { "step": 1830, "loss": 0.5631651878356934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.573869" }, { "step": 1831, "loss": 1.4111907482147217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.660020" }, { "step": 1832, "loss": 0.927198588848114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.753084" }, { "step": 1833, "loss": 0.5101783871650696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.837800" }, { "step": 1834, "loss": 0.8698747158050537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:05.960136" }, { "step": 1835, "loss": 0.5173764228820801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.045995" }, { "step": 1836, "loss": 0.8246023654937744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.161595" }, { "step": 1837, "loss": 0.933089017868042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.270906" }, { "step": 1838, "loss": 0.7520145177841187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.355885" }, { "step": 1839, "loss": 0.7937530279159546, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.442134" }, { "step": 1840, "loss": 0.9424737095832825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.546024" }, { "step": 1841, "loss": 0.7017821073532104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.663279" }, { "step": 1842, "loss": 0.7552847862243652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.758593" }, { "step": 1843, "loss": 0.555665910243988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.849575" }, { "step": 1844, "loss": 0.48038357496261597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:06.944853" }, { "step": 1845, "loss": 0.7498619556427002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.037043" }, { "step": 1846, "loss": 0.6364915370941162, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.132370" }, { "step": 1847, "loss": 0.8513547778129578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.217350" }, { "step": 1848, "loss": 0.8519651889801025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.309266" }, { "step": 1849, "loss": 1.0298044681549072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.403358" }, { "step": 1850, "loss": 0.9284107685089111, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.525206" }, { "step": 1851, "loss": 0.501100480556488, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.611921" }, { "step": 1852, "loss": 0.5783929228782654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.697925" }, { "step": 1853, "loss": 0.866767168045044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.786499" }, { "step": 1854, "loss": 1.0762834548950195, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.873065" }, { "step": 1855, "loss": 0.5726102590560913, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:07.957877" }, { "step": 1856, "loss": 1.1122097969055176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.067346" }, { "step": 1857, "loss": 0.8702807426452637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.153348" }, { "step": 1858, "loss": 0.8441775441169739, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.265564" }, { "step": 1859, "loss": 0.6987736225128174, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.353878" }, { "step": 1860, "loss": 0.7678226232528687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.447896" }, { "step": 1861, "loss": 0.48547816276550293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.535062" }, { "step": 1862, "loss": 0.9926657676696777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.639056" }, { "step": 1863, "loss": 0.8456896543502808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.723764" }, { "step": 1864, "loss": 0.8266201019287109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.838506" }, { "step": 1865, "loss": 0.4656114876270294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:08.924067" }, { "step": 1866, "loss": 0.4979897141456604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.015632" }, { "step": 1867, "loss": 0.6560565829277039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.108036" }, { "step": 1868, "loss": 0.8896043300628662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.193587" }, { "step": 1869, "loss": 0.8859495520591736, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.278640" }, { "step": 1870, "loss": 0.5234035849571228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.367081" }, { "step": 1871, "loss": 0.5119367241859436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.461426" }, { "step": 1872, "loss": 0.28662678599357605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.557384" }, { "step": 1873, "loss": 0.9281425476074219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.642631" }, { "step": 1874, "loss": 0.7509031891822815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.753661" }, { "step": 1875, "loss": 0.7369124293327332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.855207" }, { "step": 1876, "loss": 0.40913575887680054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:09.940368" }, { "step": 1877, "loss": 0.6345843076705933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.038414" }, { "step": 1878, "loss": 1.1139532327651978, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.150590" }, { "step": 1879, "loss": 0.4211101531982422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.246213" }, { "step": 1880, "loss": 0.7771605849266052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.337339" }, { "step": 1881, "loss": 1.0112638473510742, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.431952" }, { "step": 1882, "loss": 1.0529471635818481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.542195" }, { "step": 1883, "loss": 0.873255729675293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.628756" }, { "step": 1884, "loss": 0.744253396987915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.714511" }, { "step": 1885, "loss": 0.96895432472229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.835932" }, { "step": 1886, "loss": 0.9584499001502991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:10.936757" }, { "step": 1887, "loss": 0.7388558387756348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.026520" }, { "step": 1888, "loss": 0.9128726720809937, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.112020" }, { "step": 1889, "loss": 0.9965624809265137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.196347" }, { "step": 1890, "loss": 0.6124939918518066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.283887" }, { "step": 1891, "loss": 1.0247478485107422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.371644" }, { "step": 1892, "loss": 0.6131253838539124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.458080" }, { "step": 1893, "loss": 1.0312659740447998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.545663" }, { "step": 1894, "loss": 0.9801608920097351, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.656300" }, { "step": 1895, "loss": 0.7698161602020264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.764329" }, { "step": 1896, "loss": 0.6428829431533813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.857372" }, { "step": 1897, "loss": 1.0154932737350464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:11.964848" }, { "step": 1898, "loss": 0.7801030874252319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.049398" }, { "step": 1899, "loss": 0.5553430914878845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.149311" }, { "step": 1900, "loss": 0.5887404680252075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.243892" }, { "step": 1901, "loss": 0.6570307016372681, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.328858" }, { "step": 1902, "loss": 0.9952781796455383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.418036" }, { "step": 1903, "loss": 0.9754607081413269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.536185" }, { "step": 1904, "loss": 0.7709250450134277, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.621305" }, { "step": 1905, "loss": 0.77546226978302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.707980" }, { "step": 1906, "loss": 0.7188384532928467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.826991" }, { "step": 1907, "loss": 0.6045461893081665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:12.919650" }, { "step": 1908, "loss": 0.8227835297584534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.008116" }, { "step": 1909, "loss": 0.6920571327209473, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.126633" }, { "step": 1910, "loss": 0.4282805323600769, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.214615" }, { "step": 1911, "loss": 1.0521128177642822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.327954" }, { "step": 1912, "loss": 0.6239827275276184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.430037" }, { "step": 1913, "loss": 0.675784707069397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.524909" }, { "step": 1914, "loss": 1.1308202743530273, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.614573" }, { "step": 1915, "loss": 0.7930194139480591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.725102" }, { "step": 1916, "loss": 0.5585340857505798, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.819170" }, { "step": 1917, "loss": 0.8877888917922974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:13.954250" }, { "step": 1918, "loss": 1.167547583580017, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.051656" }, { "step": 1919, "loss": 0.9106568694114685, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.147741" }, { "step": 1920, "loss": 0.800535261631012, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.264902" }, { "step": 1921, "loss": 0.7520840764045715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.358449" }, { "step": 1922, "loss": 0.7552651762962341, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.447347" }, { "step": 1923, "loss": 0.4641299247741699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.534037" }, { "step": 1924, "loss": 0.9257285594940186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.635078" }, { "step": 1925, "loss": 0.8224716186523438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.744809" }, { "step": 1926, "loss": 1.0898398160934448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.863299" }, { "step": 1927, "loss": 0.7924581170082092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:14.956359" }, { "step": 1928, "loss": 0.6222105026245117, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.053759" }, { "step": 1929, "loss": 0.6578580141067505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.145316" }, { "step": 1930, "loss": 0.9247274398803711, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.244472" }, { "step": 1931, "loss": 0.7395702600479126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.356537" }, { "step": 1932, "loss": 0.6228796243667603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.443498" }, { "step": 1933, "loss": 0.8714454770088196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.536701" }, { "step": 1934, "loss": 0.5526946187019348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.629124" }, { "step": 1935, "loss": 0.5159721374511719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.727023" }, { "step": 1936, "loss": 0.891792893409729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.821746" }, { "step": 1937, "loss": 0.6722465753555298, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:15.917580" }, { "step": 1938, "loss": 0.4797954261302948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.010155" }, { "step": 1939, "loss": 1.057007074356079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.093021" }, { "step": 1940, "loss": 1.4015158414840698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.179802" }, { "step": 1941, "loss": 0.9476916193962097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.290356" }, { "step": 1942, "loss": 0.4910714626312256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.384284" }, { "step": 1943, "loss": 0.44559869170188904, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.470803" }, { "step": 1944, "loss": 0.6030001044273376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.592366" }, { "step": 1945, "loss": 0.6753707528114319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.687522" }, { "step": 1946, "loss": 0.8787838220596313, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.771184" }, { "step": 1947, "loss": 0.7671337127685547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.861768" }, { "step": 1948, "loss": 1.1945006847381592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:16.947727" }, { "step": 1949, "loss": 0.9443155527114868, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.035920" }, { "step": 1950, "loss": 0.6619548201560974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.129053" }, { "step": 1951, "loss": 0.8160449862480164, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.216378" }, { "step": 1952, "loss": 0.7852799296379089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.319163" }, { "step": 1953, "loss": 0.9625654220581055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.407241" }, { "step": 1954, "loss": 0.7032355666160583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.490158" }, { "step": 1955, "loss": 0.6822159290313721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.580951" }, { "step": 1956, "loss": 0.6953666806221008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.685906" }, { "step": 1957, "loss": 0.6217108964920044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.782233" }, { "step": 1958, "loss": 0.5208332538604736, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.867320" }, { "step": 1959, "loss": 0.6080406904220581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:17.955245" }, { "step": 1960, "loss": 0.5748878717422485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.046217" }, { "step": 1961, "loss": 0.8010828495025635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.159347" }, { "step": 1962, "loss": 0.822622537612915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.252383" }, { "step": 1963, "loss": 0.591983437538147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.342526" }, { "step": 1964, "loss": 0.8100687861442566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.456473" }, { "step": 1965, "loss": 1.2616339921951294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.540861" }, { "step": 1966, "loss": 0.4129089117050171, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.633286" }, { "step": 1967, "loss": 0.8072668313980103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.721219" }, { "step": 1968, "loss": 0.9316155314445496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.808537" }, { "step": 1969, "loss": 0.9009596109390259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:18.930297" }, { "step": 1970, "loss": 0.7634180188179016, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.017417" }, { "step": 1971, "loss": 0.7224233150482178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.110588" }, { "step": 1972, "loss": 0.5351408123970032, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.240075" }, { "step": 1973, "loss": 0.6618126630783081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.332720" }, { "step": 1974, "loss": 0.8647774457931519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.439063" }, { "step": 1975, "loss": 1.0798931121826172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.524481" }, { "step": 1976, "loss": 0.5879663228988647, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.610338" }, { "step": 1977, "loss": 0.8216493129730225, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.726412" }, { "step": 1978, "loss": 0.7521553039550781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.819913" }, { "step": 1979, "loss": 1.0475980043411255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:19.927018" }, { "step": 1980, "loss": 0.5756022930145264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.016424" }, { "step": 1981, "loss": 0.512327253818512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.104834" }, { "step": 1982, "loss": 1.0056967735290527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.214408" }, { "step": 1983, "loss": 1.0527366399765015, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.325869" }, { "step": 1984, "loss": 0.4754277467727661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.412466" }, { "step": 1985, "loss": 0.7219148278236389, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.499656" }, { "step": 1986, "loss": 0.7799282670021057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.590323" }, { "step": 1987, "loss": 0.5784151554107666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.681991" }, { "step": 1988, "loss": 0.7918798923492432, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.774333" }, { "step": 1989, "loss": 0.5772669315338135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.872089" }, { "step": 1990, "loss": 0.8480250835418701, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:20.958548" }, { "step": 1991, "loss": 0.9738643169403076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.055441" }, { "step": 1992, "loss": 0.29701071977615356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.140883" }, { "step": 1993, "loss": 0.6756932735443115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.226206" }, { "step": 1994, "loss": 0.8952434062957764, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.319828" }, { "step": 1995, "loss": 0.7170482277870178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.431913" }, { "step": 1996, "loss": 0.7582149505615234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.524140" }, { "step": 1997, "loss": 1.1852198839187622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.609162" }, { "step": 1998, "loss": 0.6584182977676392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.727526" }, { "step": 1999, "loss": 0.811110258102417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.816342" }, { "step": 2000, "loss": 0.8418666124343872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:21.925592" }, { "step": 2001, "loss": 0.5327990055084229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:44.912951" }, { "step": 2002, "loss": 0.7475180625915527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.001131" }, { "step": 2003, "loss": 0.8749673962593079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.087687" }, { "step": 2004, "loss": 1.1086535453796387, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.201122" }, { "step": 2005, "loss": 1.1150469779968262, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.318251" }, { "step": 2006, "loss": 0.7147820591926575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.407108" }, { "step": 2007, "loss": 0.5765021443367004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.496713" }, { "step": 2008, "loss": 0.9027854204177856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.581921" }, { "step": 2009, "loss": 0.6244751214981079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.681503" }, { "step": 2010, "loss": 0.861250638961792, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.767788" }, { "step": 2011, "loss": 0.9899379014968872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.852812" }, { "step": 2012, "loss": 0.775721549987793, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:45.940365" }, { "step": 2013, "loss": 0.6310442090034485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.060392" }, { "step": 2014, "loss": 0.9116814732551575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.179061" }, { "step": 2015, "loss": 0.7557075619697571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.268560" }, { "step": 2016, "loss": 0.5977158546447754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.358690" }, { "step": 2017, "loss": 0.5623772144317627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.450561" }, { "step": 2018, "loss": 0.6577892899513245, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.547765" }, { "step": 2019, "loss": 0.5260482430458069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.641869" }, { "step": 2020, "loss": 0.9261269569396973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.756895" }, { "step": 2021, "loss": 0.8329193592071533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.850629" }, { "step": 2022, "loss": 1.080298662185669, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:46.967757" }, { "step": 2023, "loss": 0.8774429559707642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.083518" }, { "step": 2024, "loss": 0.3868868350982666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.177088" }, { "step": 2025, "loss": 0.6322320103645325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.273342" }, { "step": 2026, "loss": 0.747350811958313, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.365995" }, { "step": 2027, "loss": 0.7900892496109009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.459440" }, { "step": 2028, "loss": 0.6939447522163391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.548034" }, { "step": 2029, "loss": 0.8595272898674011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.632886" }, { "step": 2030, "loss": 0.46658623218536377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.717807" }, { "step": 2031, "loss": 1.1152490377426147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.806210" }, { "step": 2032, "loss": 0.9112299680709839, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:47.912555" }, { "step": 2033, "loss": 1.0627232789993286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.027609" }, { "step": 2034, "loss": 0.6772646903991699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.133136" }, { "step": 2035, "loss": 0.8445037603378296, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.226567" }, { "step": 2036, "loss": 0.784016489982605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.311507" }, { "step": 2037, "loss": 0.6405957937240601, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.397852" }, { "step": 2038, "loss": 0.6325603723526001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.493733" }, { "step": 2039, "loss": 0.8544020652770996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.588560" }, { "step": 2040, "loss": 0.851189136505127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.680323" }, { "step": 2041, "loss": 0.7705767154693604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.774520" }, { "step": 2042, "loss": 0.6034852266311646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.875921" }, { "step": 2043, "loss": 1.1980056762695312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:48.961294" }, { "step": 2044, "loss": 0.791743278503418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.052709" }, { "step": 2045, "loss": 0.809790849685669, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.174535" }, { "step": 2046, "loss": 0.7527389526367188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.264035" }, { "step": 2047, "loss": 0.48082292079925537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.350164" }, { "step": 2048, "loss": 0.9297913312911987, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.435911" }, { "step": 2049, "loss": 0.8382928967475891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.531529" }, { "step": 2050, "loss": 0.7008343935012817, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.644954" }, { "step": 2051, "loss": 0.7494572401046753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.731199" }, { "step": 2052, "loss": 0.6800843477249146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.824505" }, { "step": 2053, "loss": 1.076270580291748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:49.916529" }, { "step": 2054, "loss": 1.034283995628357, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.005543" }, { "step": 2055, "loss": 0.5453467965126038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.097362" }, { "step": 2056, "loss": 0.6139431595802307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.184632" }, { "step": 2057, "loss": 0.7131550312042236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.269723" }, { "step": 2058, "loss": 0.672147274017334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.364849" }, { "step": 2059, "loss": 0.7885032892227173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.485267" }, { "step": 2060, "loss": 0.9244424104690552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.622738" }, { "step": 2061, "loss": 0.5237529277801514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.707659" }, { "step": 2062, "loss": 0.9487952589988708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.800809" }, { "step": 2063, "loss": 0.5140902996063232, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.892874" }, { "step": 2064, "loss": 0.8160005807876587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:50.981277" }, { "step": 2065, "loss": 0.906071126461029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.068782" }, { "step": 2066, "loss": 1.0516114234924316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.179687" }, { "step": 2067, "loss": 1.0079174041748047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.289006" }, { "step": 2068, "loss": 1.0717167854309082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.386975" }, { "step": 2069, "loss": 0.7504427433013916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.492372" }, { "step": 2070, "loss": 0.7269868850708008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.585862" }, { "step": 2071, "loss": 0.8221076726913452, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.673153" }, { "step": 2072, "loss": 0.45040684938430786, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.763448" }, { "step": 2073, "loss": 1.1505159139633179, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.850290" }, { "step": 2074, "loss": 0.5650702714920044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:51.969587" }, { "step": 2075, "loss": 0.7258095741271973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.055097" }, { "step": 2076, "loss": 0.9384150505065918, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.152925" }, { "step": 2077, "loss": 0.7584865689277649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.292047" }, { "step": 2078, "loss": 0.6355594992637634, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.380627" }, { "step": 2079, "loss": 0.6570427417755127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.471120" }, { "step": 2080, "loss": 0.8679275512695312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.565003" }, { "step": 2081, "loss": 0.9052442908287048, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.698160" }, { "step": 2082, "loss": 0.8012522459030151, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.791396" }, { "step": 2083, "loss": 0.9728863835334778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.875830" }, { "step": 2084, "loss": 0.3625098466873169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:52.961859" }, { "step": 2085, "loss": 0.6949154138565063, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.046669" }, { "step": 2086, "loss": 0.741844892501831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.156897" }, { "step": 2087, "loss": 0.5587087869644165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.239651" }, { "step": 2088, "loss": 1.085228443145752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.324563" }, { "step": 2089, "loss": 0.7781505584716797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.414566" }, { "step": 2090, "loss": 0.9970237016677856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.508441" }, { "step": 2091, "loss": 0.7722925543785095, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.601593" }, { "step": 2092, "loss": 0.578615128993988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.687179" }, { "step": 2093, "loss": 0.6671923398971558, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.779450" }, { "step": 2094, "loss": 0.703940749168396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.881809" }, { "step": 2095, "loss": 1.1990106105804443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:53.995928" }, { "step": 2096, "loss": 0.4779035449028015, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.086591" }, { "step": 2097, "loss": 0.7698163986206055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.178952" }, { "step": 2098, "loss": 1.010088324546814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.319670" }, { "step": 2099, "loss": 0.4070402979850769, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.417292" }, { "step": 2100, "loss": 0.7160179018974304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.504652" }, { "step": 2101, "loss": 0.8096165657043457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.610601" }, { "step": 2102, "loss": 0.7915735840797424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.707473" }, { "step": 2103, "loss": 0.9250328540802002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.829253" }, { "step": 2104, "loss": 0.885496973991394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:54.917755" }, { "step": 2105, "loss": 0.6748918294906616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.011522" }, { "step": 2106, "loss": 0.675432026386261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.104502" }, { "step": 2107, "loss": 0.8798873424530029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.193503" }, { "step": 2108, "loss": 0.7944731712341309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.288276" }, { "step": 2109, "loss": 0.7451233863830566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.372263" }, { "step": 2110, "loss": 0.4473828673362732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.457563" }, { "step": 2111, "loss": 0.5502047538757324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.549918" }, { "step": 2112, "loss": 0.7394700050354004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.642480" }, { "step": 2113, "loss": 0.29510030150413513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.728232" }, { "step": 2114, "loss": 0.5971872806549072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.812461" }, { "step": 2115, "loss": 0.7589570879936218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:55.924516" }, { "step": 2116, "loss": 0.6909990310668945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.009788" }, { "step": 2117, "loss": 0.7764163017272949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.103684" }, { "step": 2118, "loss": 0.6614155769348145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.193144" }, { "step": 2119, "loss": 0.6113893985748291, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.282949" }, { "step": 2120, "loss": 0.759284257888794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.369814" }, { "step": 2121, "loss": 0.7434566617012024, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.455449" }, { "step": 2122, "loss": 0.7878098487854004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.573707" }, { "step": 2123, "loss": 1.0899617671966553, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.669037" }, { "step": 2124, "loss": 0.6030062437057495, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.769235" }, { "step": 2125, "loss": 1.0014410018920898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.864187" }, { "step": 2126, "loss": 1.0367460250854492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:56.976464" }, { "step": 2127, "loss": 0.6560336947441101, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.067440" }, { "step": 2128, "loss": 0.7706923484802246, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.151860" }, { "step": 2129, "loss": 0.7819386720657349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.243797" }, { "step": 2130, "loss": 0.710226833820343, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.334731" }, { "step": 2131, "loss": 1.0756052732467651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.434575" }, { "step": 2132, "loss": 0.725184977054596, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.531129" }, { "step": 2133, "loss": 0.5976231098175049, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.625676" }, { "step": 2134, "loss": 0.9360681772232056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.711866" }, { "step": 2135, "loss": 0.46644508838653564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.801479" }, { "step": 2136, "loss": 0.4403388202190399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:57.891593" }, { "step": 2137, "loss": 1.1091973781585693, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.003109" }, { "step": 2138, "loss": 0.8626742959022522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.093937" }, { "step": 2139, "loss": 1.0000176429748535, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.183770" }, { "step": 2140, "loss": 0.5084090828895569, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.270432" }, { "step": 2141, "loss": 0.8802869319915771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.371151" }, { "step": 2142, "loss": 0.8684374094009399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.487149" }, { "step": 2143, "loss": 0.5750052332878113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.578345" }, { "step": 2144, "loss": 0.8629574179649353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.663755" }, { "step": 2145, "loss": 0.6888532042503357, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.756039" }, { "step": 2146, "loss": 0.6112690567970276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.848564" }, { "step": 2147, "loss": 0.5765454769134521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:58.935387" }, { "step": 2148, "loss": 0.6824730038642883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.027016" }, { "step": 2149, "loss": 1.0703377723693848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.161687" }, { "step": 2150, "loss": 0.7919694185256958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.282169" }, { "step": 2151, "loss": 0.5575411319732666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.377440" }, { "step": 2152, "loss": 0.7918276786804199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.463020" }, { "step": 2153, "loss": 0.6338595747947693, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.563655" }, { "step": 2154, "loss": 0.6149189472198486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.657162" }, { "step": 2155, "loss": 0.7511393427848816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.773546" }, { "step": 2156, "loss": 0.7959324717521667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.857794" }, { "step": 2157, "loss": 0.8319166898727417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:27:59.959472" }, { "step": 2158, "loss": 0.8276342749595642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.048965" }, { "step": 2159, "loss": 0.5605116486549377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.143019" }, { "step": 2160, "loss": 0.9446595907211304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.252810" }, { "step": 2161, "loss": 0.7259869575500488, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.346509" }, { "step": 2162, "loss": 0.5860852003097534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.441847" }, { "step": 2163, "loss": 0.7626826763153076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.549588" }, { "step": 2164, "loss": 0.6047133207321167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.636019" }, { "step": 2165, "loss": 0.9707897901535034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.754069" }, { "step": 2166, "loss": 0.8291369676589966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.850218" }, { "step": 2167, "loss": 0.7278308868408203, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:00.962899" }, { "step": 2168, "loss": 0.7750736474990845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.073139" }, { "step": 2169, "loss": 0.7176913022994995, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.164866" }, { "step": 2170, "loss": 1.07511305809021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.263479" }, { "step": 2171, "loss": 0.37143006920814514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.352794" }, { "step": 2172, "loss": 0.8522204160690308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.440387" }, { "step": 2173, "loss": 0.4966774880886078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.533000" }, { "step": 2174, "loss": 0.5337688326835632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.618351" }, { "step": 2175, "loss": 0.6058633327484131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.707881" }, { "step": 2176, "loss": 0.8226615786552429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.837937" }, { "step": 2177, "loss": 0.6725635528564453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:01.924477" }, { "step": 2178, "loss": 1.1486363410949707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.007293" }, { "step": 2179, "loss": 0.5386438965797424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.097953" }, { "step": 2180, "loss": 0.9573469161987305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.184565" }, { "step": 2181, "loss": 0.9603239893913269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.274687" }, { "step": 2182, "loss": 1.0066797733306885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.388758" }, { "step": 2183, "loss": 1.1811528205871582, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.475265" }, { "step": 2184, "loss": 0.5455707907676697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.559942" }, { "step": 2185, "loss": 0.6785417795181274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.643732" }, { "step": 2186, "loss": 0.8713365793228149, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.729201" }, { "step": 2187, "loss": 0.7512391209602356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.842489" }, { "step": 2188, "loss": 0.8678900003433228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:02.930149" }, { "step": 2189, "loss": 0.6475967168807983, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.019203" }, { "step": 2190, "loss": 0.7228530049324036, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.136201" }, { "step": 2191, "loss": 0.5685636401176453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.231595" }, { "step": 2192, "loss": 0.6682023406028748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.318979" }, { "step": 2193, "loss": 0.7647811770439148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.429881" }, { "step": 2194, "loss": 0.7705960273742676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.522783" }, { "step": 2195, "loss": 0.6103343367576599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.616861" }, { "step": 2196, "loss": 0.9527674913406372, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.708402" }, { "step": 2197, "loss": 0.5195720195770264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.808314" }, { "step": 2198, "loss": 0.5516658425331116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.896527" }, { "step": 2199, "loss": 0.906133770942688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:03.989782" }, { "step": 2200, "loss": 0.8090426921844482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.076093" }, { "step": 2201, "loss": 0.8095670938491821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.191235" }, { "step": 2202, "loss": 0.9014479517936707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.276721" }, { "step": 2203, "loss": 0.47529804706573486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.370252" }, { "step": 2204, "loss": 0.5888440012931824, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.463228" }, { "step": 2205, "loss": 0.7600259780883789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.549336" }, { "step": 2206, "loss": 0.6884351968765259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.665486" }, { "step": 2207, "loss": 0.8580024838447571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.785406" }, { "step": 2208, "loss": 0.5876350998878479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.870512" }, { "step": 2209, "loss": 0.44177961349487305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:04.962414" }, { "step": 2210, "loss": 0.9948874711990356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.082119" }, { "step": 2211, "loss": 1.2360060214996338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.169244" }, { "step": 2212, "loss": 0.6514761447906494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.260565" }, { "step": 2213, "loss": 0.8941179513931274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.350160" }, { "step": 2214, "loss": 0.8189272880554199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.466290" }, { "step": 2215, "loss": 0.7438778281211853, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.584618" }, { "step": 2216, "loss": 0.734805703163147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.712377" }, { "step": 2217, "loss": 0.36497628688812256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.798165" }, { "step": 2218, "loss": 0.6720117926597595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.897213" }, { "step": 2219, "loss": 0.4388832151889801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:05.998190" }, { "step": 2220, "loss": 1.0532678365707397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.108714" }, { "step": 2221, "loss": 0.8904229402542114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.198299" }, { "step": 2222, "loss": 0.7806097269058228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.288255" }, { "step": 2223, "loss": 0.5550211668014526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.390907" }, { "step": 2224, "loss": 0.9466104507446289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.509366" }, { "step": 2225, "loss": 0.3910347819328308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.601537" }, { "step": 2226, "loss": 0.694291353225708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.686674" }, { "step": 2227, "loss": 0.6718630194664001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.774858" }, { "step": 2228, "loss": 0.9928800463676453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.864967" }, { "step": 2229, "loss": 0.5808544158935547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:06.956661" }, { "step": 2230, "loss": 0.7402147054672241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.051670" }, { "step": 2231, "loss": 0.44448360800743103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.150332" }, { "step": 2232, "loss": 0.5882808566093445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.238397" }, { "step": 2233, "loss": 1.011368751525879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.352236" }, { "step": 2234, "loss": 0.9784140586853027, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.465409" }, { "step": 2235, "loss": 0.611537754535675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.557764" }, { "step": 2236, "loss": 0.8439615368843079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.644187" }, { "step": 2237, "loss": 0.5794658064842224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.742855" }, { "step": 2238, "loss": 0.6905092000961304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.837052" }, { "step": 2239, "loss": 0.8778727054595947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:07.932703" }, { "step": 2240, "loss": 0.7513993978500366, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.024083" }, { "step": 2241, "loss": 0.7658003568649292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.142137" }, { "step": 2242, "loss": 1.1147640943527222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.252343" }, { "step": 2243, "loss": 0.8175036907196045, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.361694" }, { "step": 2244, "loss": 0.847907304763794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.477741" }, { "step": 2245, "loss": 0.9478477239608765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.580960" }, { "step": 2246, "loss": 0.47353649139404297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.676702" }, { "step": 2247, "loss": 0.7375133633613586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.762044" }, { "step": 2248, "loss": 0.8391348719596863, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.858484" }, { "step": 2249, "loss": 0.9557561874389648, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:08.945901" }, { "step": 2250, "loss": 0.8712379932403564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.057213" }, { "step": 2251, "loss": 0.8747225999832153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.150276" }, { "step": 2252, "loss": 0.9357011318206787, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.235966" }, { "step": 2253, "loss": 0.8513723015785217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.324597" }, { "step": 2254, "loss": 1.1454885005950928, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.410246" }, { "step": 2255, "loss": 0.7711843252182007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.506996" }, { "step": 2256, "loss": 0.7287879586219788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.616070" }, { "step": 2257, "loss": 0.9378596544265747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.731318" }, { "step": 2258, "loss": 0.7059426307678223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.831526" }, { "step": 2259, "loss": 0.7905710935592651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:09.926814" }, { "step": 2260, "loss": 0.7242194414138794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.054289" }, { "step": 2261, "loss": 0.8655166625976562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.169054" }, { "step": 2262, "loss": 0.7734136581420898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.256429" }, { "step": 2263, "loss": 0.9726660847663879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.343492" }, { "step": 2264, "loss": 0.7142245769500732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.432018" }, { "step": 2265, "loss": 0.992193341255188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.518221" }, { "step": 2266, "loss": 0.6759348511695862, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.611580" }, { "step": 2267, "loss": 0.6004000306129456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.696376" }, { "step": 2268, "loss": 1.19943106174469, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.781848" }, { "step": 2269, "loss": 0.7896913290023804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:10.902104" }, { "step": 2270, "loss": 0.7869384288787842, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.025896" }, { "step": 2271, "loss": 1.0361709594726562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.123051" }, { "step": 2272, "loss": 1.0664362907409668, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.207476" }, { "step": 2273, "loss": 0.5452553033828735, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.301346" }, { "step": 2274, "loss": 0.40225836634635925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.394663" }, { "step": 2275, "loss": 0.8407100439071655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.479861" }, { "step": 2276, "loss": 0.676964282989502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.566157" }, { "step": 2277, "loss": 0.6937047839164734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.651368" }, { "step": 2278, "loss": 0.5010048151016235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.745287" }, { "step": 2279, "loss": 0.6105594038963318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.858555" }, { "step": 2280, "loss": 0.6180406808853149, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:11.950767" }, { "step": 2281, "loss": 1.0297950506210327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.051588" }, { "step": 2282, "loss": 0.76450514793396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.172915" }, { "step": 2283, "loss": 0.5822180509567261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.267221" }, { "step": 2284, "loss": 0.566291332244873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.353278" }, { "step": 2285, "loss": 1.0329610109329224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.438633" }, { "step": 2286, "loss": 0.5563249588012695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.530975" }, { "step": 2287, "loss": 0.5168514251708984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.635027" }, { "step": 2288, "loss": 0.9988799095153809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.722842" }, { "step": 2289, "loss": 0.6697511672973633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.813491" }, { "step": 2290, "loss": 0.8027690052986145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.906997" }, { "step": 2291, "loss": 0.721511721611023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:12.998435" }, { "step": 2292, "loss": 0.9295133352279663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.083932" }, { "step": 2293, "loss": 0.7832179069519043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.170748" }, { "step": 2294, "loss": 0.44075334072113037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.263650" }, { "step": 2295, "loss": 0.650448203086853, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.358484" }, { "step": 2296, "loss": 0.8282707929611206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.451629" }, { "step": 2297, "loss": 0.8462172746658325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.568902" }, { "step": 2298, "loss": 0.8324995636940002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.689464" }, { "step": 2299, "loss": 0.4813624620437622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.782082" }, { "step": 2300, "loss": 0.6936866641044617, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:13.912093" }, { "step": 2301, "loss": 0.6642893552780151, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.037902" }, { "step": 2302, "loss": 0.5488666892051697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.128493" }, { "step": 2303, "loss": 1.1932227611541748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.221709" }, { "step": 2304, "loss": 0.895733118057251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.330274" }, { "step": 2305, "loss": 0.6423083543777466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.417500" }, { "step": 2306, "loss": 1.098591685295105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.529997" }, { "step": 2307, "loss": 1.0600066184997559, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.621552" }, { "step": 2308, "loss": 1.0905416011810303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.771930" }, { "step": 2309, "loss": 0.8678314685821533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.865226" }, { "step": 2310, "loss": 0.9953528642654419, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:14.949720" }, { "step": 2311, "loss": 0.8002020716667175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.047969" }, { "step": 2312, "loss": 0.7027350068092346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.143842" }, { "step": 2313, "loss": 0.7659244537353516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.237106" }, { "step": 2314, "loss": 0.9989719390869141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.348423" }, { "step": 2315, "loss": 0.6724352836608887, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.493380" }, { "step": 2316, "loss": 0.8195427060127258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.579418" }, { "step": 2317, "loss": 0.9714542627334595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.670046" }, { "step": 2318, "loss": 0.7961300611495972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.755090" }, { "step": 2319, "loss": 0.7261470556259155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.845503" }, { "step": 2320, "loss": 0.7505465745925903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:15.937769" }, { "step": 2321, "loss": 0.4882180690765381, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.028888" }, { "step": 2322, "loss": 0.9337656497955322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.118476" }, { "step": 2323, "loss": 0.6063697934150696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.204126" }, { "step": 2324, "loss": 0.6531232595443726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.290203" }, { "step": 2325, "loss": 0.898598313331604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.403965" }, { "step": 2326, "loss": 0.6746120452880859, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.493434" }, { "step": 2327, "loss": 0.7715129852294922, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.593821" }, { "step": 2328, "loss": 0.3962881565093994, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.693026" }, { "step": 2329, "loss": 0.38545557856559753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.794067" }, { "step": 2330, "loss": 0.8595545887947083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.880304" }, { "step": 2331, "loss": 0.6607144474983215, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:16.974248" }, { "step": 2332, "loss": 0.8590443134307861, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.073015" }, { "step": 2333, "loss": 0.9635311365127563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.194281" }, { "step": 2334, "loss": 0.48304879665374756, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.279098" }, { "step": 2335, "loss": 0.877820611000061, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.381374" }, { "step": 2336, "loss": 0.8392512798309326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.470882" }, { "step": 2337, "loss": 0.7093725800514221, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.555643" }, { "step": 2338, "loss": 0.39966467022895813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.649191" }, { "step": 2339, "loss": 0.4893294870853424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.742791" }, { "step": 2340, "loss": 0.5726196765899658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.828615" }, { "step": 2341, "loss": 0.8224740028381348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:17.917040" }, { "step": 2342, "loss": 0.391817569732666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.002430" }, { "step": 2343, "loss": 0.6932047605514526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.122076" }, { "step": 2344, "loss": 0.49650150537490845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.222223" }, { "step": 2345, "loss": 0.9491152763366699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.309715" }, { "step": 2346, "loss": 0.6644223928451538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.396037" }, { "step": 2347, "loss": 0.8159900307655334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.509878" }, { "step": 2348, "loss": 0.7903963923454285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.604480" }, { "step": 2349, "loss": 0.4687157869338989, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.698151" }, { "step": 2350, "loss": 0.8107753396034241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.790965" }, { "step": 2351, "loss": 1.0227230787277222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.886491" }, { "step": 2352, "loss": 0.495029091835022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:18.986863" }, { "step": 2353, "loss": 0.5662938952445984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.072445" }, { "step": 2354, "loss": 0.533187747001648, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.169709" }, { "step": 2355, "loss": 0.8431695699691772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.286657" }, { "step": 2356, "loss": 0.7227425575256348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.376256" }, { "step": 2357, "loss": 0.8085408806800842, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.469534" }, { "step": 2358, "loss": 0.6067893505096436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.560614" }, { "step": 2359, "loss": 0.7411522269248962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.645952" }, { "step": 2360, "loss": 0.885342538356781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.763154" }, { "step": 2361, "loss": 0.4535307288169861, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.855207" }, { "step": 2362, "loss": 0.49838322401046753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:19.945800" }, { "step": 2363, "loss": 0.9010220766067505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.030177" }, { "step": 2364, "loss": 0.6115921139717102, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.156318" }, { "step": 2365, "loss": 0.9138056039810181, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.248249" }, { "step": 2366, "loss": 0.6898201107978821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.345648" }, { "step": 2367, "loss": 0.7308764457702637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.439510" }, { "step": 2368, "loss": 0.4144588112831116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.538694" }, { "step": 2369, "loss": 0.5613586902618408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.629329" }, { "step": 2370, "loss": 0.6909253597259521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.716690" }, { "step": 2371, "loss": 0.8298625946044922, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.802217" }, { "step": 2372, "loss": 0.7843093872070312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.912077" }, { "step": 2373, "loss": 1.0378042459487915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:20.999441" }, { "step": 2374, "loss": 0.6411300897598267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.091433" }, { "step": 2375, "loss": 0.790508508682251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.176446" }, { "step": 2376, "loss": 0.6701394319534302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.267339" }, { "step": 2377, "loss": 0.676306962966919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.375770" }, { "step": 2378, "loss": 0.9221720695495605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.469896" }, { "step": 2379, "loss": 0.8012794852256775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.587013" }, { "step": 2380, "loss": 0.521330714225769, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.680095" }, { "step": 2381, "loss": 1.2749272584915161, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.766606" }, { "step": 2382, "loss": 0.7815191149711609, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.874515" }, { "step": 2383, "loss": 0.7188379764556885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:21.971058" }, { "step": 2384, "loss": 1.0565260648727417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.093998" }, { "step": 2385, "loss": 0.8430009484291077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.206223" }, { "step": 2386, "loss": 0.738307774066925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.291581" }, { "step": 2387, "loss": 0.6400051116943359, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.387686" }, { "step": 2388, "loss": 1.1862449645996094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.485502" }, { "step": 2389, "loss": 0.9537123441696167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.600680" }, { "step": 2390, "loss": 0.9397864937782288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.709353" }, { "step": 2391, "loss": 0.7508140802383423, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.797752" }, { "step": 2392, "loss": 0.8122209906578064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.892805" }, { "step": 2393, "loss": 0.7606380581855774, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:22.983294" }, { "step": 2394, "loss": 0.4543752074241638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.075629" }, { "step": 2395, "loss": 0.6577134132385254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.169617" }, { "step": 2396, "loss": 0.7623952627182007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.289393" }, { "step": 2397, "loss": 0.8146102428436279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.375634" }, { "step": 2398, "loss": 0.9625040292739868, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.486049" }, { "step": 2399, "loss": 0.8448487520217896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.580242" }, { "step": 2400, "loss": 0.7029311656951904, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.668703" }, { "step": 2401, "loss": 0.4785936772823334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.756292" }, { "step": 2402, "loss": 1.2009385824203491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.848519" }, { "step": 2403, "loss": 0.682902455329895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:23.940056" }, { "step": 2404, "loss": 0.795539915561676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.037327" }, { "step": 2405, "loss": 0.6281712651252747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.135488" }, { "step": 2406, "loss": 0.6224493384361267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.222793" }, { "step": 2407, "loss": 0.6045218706130981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.337507" }, { "step": 2408, "loss": 0.548869788646698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.434533" }, { "step": 2409, "loss": 0.5905240774154663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.544359" }, { "step": 2410, "loss": 0.915543794631958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.632754" }, { "step": 2411, "loss": 0.9716109037399292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.719396" }, { "step": 2412, "loss": 0.8763704895973206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.808234" }, { "step": 2413, "loss": 0.835075855255127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:24.927237" }, { "step": 2414, "loss": 0.414737731218338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.016252" }, { "step": 2415, "loss": 0.7149311900138855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.105766" }, { "step": 2416, "loss": 0.7224946618080139, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.193563" }, { "step": 2417, "loss": 0.7222709059715271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.279496" }, { "step": 2418, "loss": 0.6474984884262085, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.370980" }, { "step": 2419, "loss": 1.0851384401321411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.492782" }, { "step": 2420, "loss": 0.7350620031356812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.578401" }, { "step": 2421, "loss": 0.7846438884735107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.664816" }, { "step": 2422, "loss": 0.496249794960022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.761187" }, { "step": 2423, "loss": 0.6857386231422424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.856912" }, { "step": 2424, "loss": 0.785902738571167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:25.960427" }, { "step": 2425, "loss": 0.823164165019989, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.053624" }, { "step": 2426, "loss": 0.6089905500411987, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.146890" }, { "step": 2427, "loss": 0.6161006093025208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.232934" }, { "step": 2428, "loss": 0.6914026737213135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.330214" }, { "step": 2429, "loss": 1.0494831800460815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.415498" }, { "step": 2430, "loss": 0.8074585199356079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.502614" }, { "step": 2431, "loss": 0.9308614134788513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.617544" }, { "step": 2432, "loss": 0.45555001497268677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.702441" }, { "step": 2433, "loss": 0.5789811611175537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.788539" }, { "step": 2434, "loss": 0.9189757108688354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.875033" }, { "step": 2435, "loss": 0.587978720664978, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:26.994251" }, { "step": 2436, "loss": 0.46555954217910767, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.093632" }, { "step": 2437, "loss": 0.87619948387146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.187502" }, { "step": 2438, "loss": 0.5989755392074585, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.282958" }, { "step": 2439, "loss": 0.6185493469238281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.370907" }, { "step": 2440, "loss": 0.7021997570991516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.468450" }, { "step": 2441, "loss": 0.8423775434494019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.554611" }, { "step": 2442, "loss": 0.8127433061599731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.651242" }, { "step": 2443, "loss": 0.6935682892799377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.745012" }, { "step": 2444, "loss": 0.7281489372253418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.836681" }, { "step": 2445, "loss": 0.7780873775482178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:27.929236" }, { "step": 2446, "loss": 0.8179944157600403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.040507" }, { "step": 2447, "loss": 0.5926216840744019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.126120" }, { "step": 2448, "loss": 0.47013893723487854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.214257" }, { "step": 2449, "loss": 0.6504830121994019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.314780" }, { "step": 2450, "loss": 0.8111204504966736, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.407576" }, { "step": 2451, "loss": 0.6939178705215454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.502844" }, { "step": 2452, "loss": 1.091234564781189, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.616892" }, { "step": 2453, "loss": 0.7216335535049438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.706694" }, { "step": 2454, "loss": 1.088988184928894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.797864" }, { "step": 2455, "loss": 0.6507583260536194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:28.912488" }, { "step": 2456, "loss": 0.6258532404899597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.000514" }, { "step": 2457, "loss": 0.998282253742218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.097529" }, { "step": 2458, "loss": 0.9019399881362915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.184191" }, { "step": 2459, "loss": 0.5302679538726807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.269310" }, { "step": 2460, "loss": 0.5611511468887329, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.358137" }, { "step": 2461, "loss": 0.5556972026824951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.448062" }, { "step": 2462, "loss": 0.6598821878433228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.533832" }, { "step": 2463, "loss": 0.6352054476737976, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.619347" }, { "step": 2464, "loss": 0.568688154220581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.703980" }, { "step": 2465, "loss": 0.9146718978881836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.815720" }, { "step": 2466, "loss": 0.8370286822319031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:29.910517" }, { "step": 2467, "loss": 0.856575608253479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.027422" }, { "step": 2468, "loss": 0.6018224954605103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.120880" }, { "step": 2469, "loss": 0.7751474380493164, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.209114" }, { "step": 2470, "loss": 0.6044608354568481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.300546" }, { "step": 2471, "loss": 0.7112745642662048, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.394740" }, { "step": 2472, "loss": 1.1046947240829468, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.479742" }, { "step": 2473, "loss": 1.0644843578338623, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.570312" }, { "step": 2474, "loss": 1.0164117813110352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.710637" }, { "step": 2475, "loss": 0.6304817199707031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.800777" }, { "step": 2476, "loss": 0.9973293542861938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.885996" }, { "step": 2477, "loss": 0.5912042260169983, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:30.999391" }, { "step": 2478, "loss": 0.4869474768638611, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.098145" }, { "step": 2479, "loss": 0.7459206581115723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.195106" }, { "step": 2480, "loss": 1.0250977277755737, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.308085" }, { "step": 2481, "loss": 0.6517376899719238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.391438" }, { "step": 2482, "loss": 0.5907399654388428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.485671" }, { "step": 2483, "loss": 0.6639254689216614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.574525" }, { "step": 2484, "loss": 1.1983017921447754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.658657" }, { "step": 2485, "loss": 0.9568012952804565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.743236" }, { "step": 2486, "loss": 0.7290898561477661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.837131" }, { "step": 2487, "loss": 0.6400020122528076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:31.930930" }, { "step": 2488, "loss": 0.9718666076660156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.046210" }, { "step": 2489, "loss": 0.7922481298446655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.140128" }, { "step": 2490, "loss": 0.5500238537788391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.240900" }, { "step": 2491, "loss": 1.1273106336593628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.349604" }, { "step": 2492, "loss": 0.5279348492622375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.442571" }, { "step": 2493, "loss": 0.42348363995552063, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.538238" }, { "step": 2494, "loss": 0.6803842782974243, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.631473" }, { "step": 2495, "loss": 1.0078859329223633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.727700" }, { "step": 2496, "loss": 0.9476116299629211, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.816095" }, { "step": 2497, "loss": 0.7056638598442078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:32.936408" }, { "step": 2498, "loss": 0.6268693208694458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:33.024564" }, { "step": 2499, "loss": 0.6188063621520996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:33.115653" }, { "step": 2500, "loss": 0.7835406064987183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:33.201878" }, { "step": 2501, "loss": 0.5020826458930969, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:55.742404" }, { "step": 2502, "loss": 0.6188787221908569, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:55.832800" }, { "step": 2503, "loss": 0.9761694669723511, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:55.942633" }, { "step": 2504, "loss": 0.6817021369934082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.060180" }, { "step": 2505, "loss": 0.48830604553222656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.157905" }, { "step": 2506, "loss": 0.3941631317138672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.245806" }, { "step": 2507, "loss": 0.7888896465301514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.329424" }, { "step": 2508, "loss": 0.46367502212524414, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.417956" }, { "step": 2509, "loss": 0.5349787473678589, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.507290" }, { "step": 2510, "loss": 0.6414687037467957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.596696" }, { "step": 2511, "loss": 0.7746042609214783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.682454" }, { "step": 2512, "loss": 0.48442739248275757, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.776535" }, { "step": 2513, "loss": 0.6899077892303467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:56.894671" }, { "step": 2514, "loss": 0.6217575073242188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.012468" }, { "step": 2515, "loss": 1.0282800197601318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.096347" }, { "step": 2516, "loss": 0.8735329508781433, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.181874" }, { "step": 2517, "loss": 0.6483060717582703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.266905" }, { "step": 2518, "loss": 0.40003207325935364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.357516" }, { "step": 2519, "loss": 0.7258505821228027, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.446427" }, { "step": 2520, "loss": 1.0314154624938965, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.586121" }, { "step": 2521, "loss": 0.7141712307929993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.683010" }, { "step": 2522, "loss": 0.4089149832725525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.774278" }, { "step": 2523, "loss": 0.8631540536880493, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.893259" }, { "step": 2524, "loss": 0.6050288677215576, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:57.979535" }, { "step": 2525, "loss": 0.6843096017837524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.076356" }, { "step": 2526, "loss": 0.3246791362762451, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.166081" }, { "step": 2527, "loss": 0.7796032428741455, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.262346" }, { "step": 2528, "loss": 0.5096229314804077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.354026" }, { "step": 2529, "loss": 0.7060723304748535, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.473465" }, { "step": 2530, "loss": 1.006749153137207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.559433" }, { "step": 2531, "loss": 0.6414542198181152, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.649619" }, { "step": 2532, "loss": 0.8463432788848877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.764609" }, { "step": 2533, "loss": 0.5164538621902466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.853388" }, { "step": 2534, "loss": 0.8751550912857056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:58.942349" }, { "step": 2535, "loss": 0.7038036584854126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.046056" }, { "step": 2536, "loss": 0.8576943874359131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.153487" }, { "step": 2537, "loss": 0.827365517616272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.239646" }, { "step": 2538, "loss": 1.0514016151428223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.326877" }, { "step": 2539, "loss": 0.9825515747070312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.412816" }, { "step": 2540, "loss": 0.5250961780548096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.500430" }, { "step": 2541, "loss": 0.8229261636734009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.597962" }, { "step": 2542, "loss": 0.8144568204879761, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.686566" }, { "step": 2543, "loss": 0.985672116279602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.789877" }, { "step": 2544, "loss": 1.0246742963790894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.898853" }, { "step": 2545, "loss": 0.7819309234619141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:28:59.986234" }, { "step": 2546, "loss": 0.41621455550193787, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.077985" }, { "step": 2547, "loss": 0.6836720705032349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.192396" }, { "step": 2548, "loss": 0.8197433948516846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.287666" }, { "step": 2549, "loss": 0.7268252372741699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.382858" }, { "step": 2550, "loss": 0.6627832055091858, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.467646" }, { "step": 2551, "loss": 0.37895655632019043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.561534" }, { "step": 2552, "loss": 0.9030309915542603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.648183" }, { "step": 2553, "loss": 0.8244903087615967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.732425" }, { "step": 2554, "loss": 0.5994800329208374, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.825131" }, { "step": 2555, "loss": 0.7935681939125061, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:00.919525" }, { "step": 2556, "loss": 0.8765281438827515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.008776" }, { "step": 2557, "loss": 0.8146405816078186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.099348" }, { "step": 2558, "loss": 0.8630602359771729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.183410" }, { "step": 2559, "loss": 0.5862079858779907, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.284733" }, { "step": 2560, "loss": 0.8341888785362244, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.378122" }, { "step": 2561, "loss": 0.6613426208496094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.479287" }, { "step": 2562, "loss": 1.2153589725494385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.574526" }, { "step": 2563, "loss": 0.8769479990005493, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.688428" }, { "step": 2564, "loss": 0.8255680799484253, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.777421" }, { "step": 2565, "loss": 0.44914209842681885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.862786" }, { "step": 2566, "loss": 0.5528694987297058, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:01.952487" }, { "step": 2567, "loss": 0.821009635925293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.039094" }, { "step": 2568, "loss": 0.8972693085670471, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.162355" }, { "step": 2569, "loss": 0.6996124386787415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.251757" }, { "step": 2570, "loss": 0.6707334518432617, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.338831" }, { "step": 2571, "loss": 0.7307754755020142, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.431762" }, { "step": 2572, "loss": 0.7486584186553955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.530116" }, { "step": 2573, "loss": 0.6178475618362427, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.615346" }, { "step": 2574, "loss": 0.5694226622581482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.711454" }, { "step": 2575, "loss": 0.8615165948867798, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.829186" }, { "step": 2576, "loss": 0.5644221305847168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:02.914084" }, { "step": 2577, "loss": 0.8887470960617065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.037489" }, { "step": 2578, "loss": 0.9534226059913635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.131718" }, { "step": 2579, "loss": 0.5991899967193604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.230465" }, { "step": 2580, "loss": 0.7827955484390259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.348493" }, { "step": 2581, "loss": 1.1470221281051636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.437090" }, { "step": 2582, "loss": 0.7651423215866089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.530309" }, { "step": 2583, "loss": 0.6220911741256714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.616349" }, { "step": 2584, "loss": 0.7601522207260132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.733042" }, { "step": 2585, "loss": 1.063822627067566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.817537" }, { "step": 2586, "loss": 0.7886562347412109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:03.927210" }, { "step": 2587, "loss": 1.127117395401001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.012224" }, { "step": 2588, "loss": 0.8666239976882935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.104551" }, { "step": 2589, "loss": 0.6858737468719482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.189798" }, { "step": 2590, "loss": 0.6970254182815552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.289923" }, { "step": 2591, "loss": 0.8785386681556702, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.382726" }, { "step": 2592, "loss": 0.8188069462776184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.503229" }, { "step": 2593, "loss": 0.9157566428184509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.613982" }, { "step": 2594, "loss": 0.8524659872055054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.723919" }, { "step": 2595, "loss": 0.7706726789474487, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.809024" }, { "step": 2596, "loss": 0.7229438424110413, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:04.940563" }, { "step": 2597, "loss": 0.6382002234458923, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.032605" }, { "step": 2598, "loss": 0.5409920811653137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.117664" }, { "step": 2599, "loss": 0.6810676455497742, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.220672" }, { "step": 2600, "loss": 0.551073431968689, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.313919" }, { "step": 2601, "loss": 0.5454932451248169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.406428" }, { "step": 2602, "loss": 0.937493085861206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.516526" }, { "step": 2603, "loss": 0.3570401072502136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.605887" }, { "step": 2604, "loss": 0.6878910064697266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.697052" }, { "step": 2605, "loss": 0.882649302482605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.806722" }, { "step": 2606, "loss": 0.5852093696594238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:05.903078" }, { "step": 2607, "loss": 0.9058747291564941, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.011197" }, { "step": 2608, "loss": 1.2520828247070312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.103618" }, { "step": 2609, "loss": 0.45540979504585266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.195948" }, { "step": 2610, "loss": 0.5740227699279785, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.295750" }, { "step": 2611, "loss": 0.7095811367034912, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.382191" }, { "step": 2612, "loss": 0.617868959903717, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.476824" }, { "step": 2613, "loss": 0.4799753427505493, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.570677" }, { "step": 2614, "loss": 0.5068426728248596, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.662150" }, { "step": 2615, "loss": 0.8209301829338074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.757240" }, { "step": 2616, "loss": 0.7799237966537476, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.842608" }, { "step": 2617, "loss": 0.7035263776779175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:06.963641" }, { "step": 2618, "loss": 0.4719783663749695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.064579" }, { "step": 2619, "loss": 0.8087038993835449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.156643" }, { "step": 2620, "loss": 1.0211254358291626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.279064" }, { "step": 2621, "loss": 0.5658661127090454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.371130" }, { "step": 2622, "loss": 0.48025912046432495, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.457930" }, { "step": 2623, "loss": 0.8613036870956421, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.543205" }, { "step": 2624, "loss": 0.8467830419540405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.629456" }, { "step": 2625, "loss": 0.27665311098098755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.715525" }, { "step": 2626, "loss": 0.8700153231620789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.811274" }, { "step": 2627, "loss": 0.5804354548454285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.909806" }, { "step": 2628, "loss": 0.7234228253364563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:07.998881" }, { "step": 2629, "loss": 0.6706821918487549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.082206" }, { "step": 2630, "loss": 0.6644691824913025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.179381" }, { "step": 2631, "loss": 0.6807067394256592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.275292" }, { "step": 2632, "loss": 0.7379690408706665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.373905" }, { "step": 2633, "loss": 0.5995013117790222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.458448" }, { "step": 2634, "loss": 0.8792905807495117, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.568263" }, { "step": 2635, "loss": 0.878854513168335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.655794" }, { "step": 2636, "loss": 0.47721683979034424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.742678" }, { "step": 2637, "loss": 0.8594365119934082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.834162" }, { "step": 2638, "loss": 0.5999180674552917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:08.919301" }, { "step": 2639, "loss": 0.6044289469718933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.007998" }, { "step": 2640, "loss": 0.7208973169326782, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.118489" }, { "step": 2641, "loss": 0.5151590704917908, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.218389" }, { "step": 2642, "loss": 0.5373598337173462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.305686" }, { "step": 2643, "loss": 0.9337553977966309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.426141" }, { "step": 2644, "loss": 0.7292783260345459, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.545519" }, { "step": 2645, "loss": 0.8219776153564453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.660150" }, { "step": 2646, "loss": 0.7183732390403748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.745300" }, { "step": 2647, "loss": 0.8202007412910461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.838164" }, { "step": 2648, "loss": 0.5913441181182861, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:09.930548" }, { "step": 2649, "loss": 0.8615386486053467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.019678" }, { "step": 2650, "loss": 0.9343962073326111, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.139822" }, { "step": 2651, "loss": 0.41572850942611694, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.238246" }, { "step": 2652, "loss": 0.5814489126205444, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.330585" }, { "step": 2653, "loss": 0.7445780038833618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.443482" }, { "step": 2654, "loss": 0.6662389636039734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.536882" }, { "step": 2655, "loss": 0.5250306129455566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.623597" }, { "step": 2656, "loss": 0.5164401531219482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.714952" }, { "step": 2657, "loss": 0.4482346177101135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.810335" }, { "step": 2658, "loss": 0.7564611434936523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.902234" }, { "step": 2659, "loss": 0.6799054741859436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:10.988763" }, { "step": 2660, "loss": 0.7482221722602844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.075911" }, { "step": 2661, "loss": 0.7973361015319824, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.174894" }, { "step": 2662, "loss": 0.6417836546897888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.266285" }, { "step": 2663, "loss": 0.728691577911377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.360623" }, { "step": 2664, "loss": 0.3751223683357239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.453457" }, { "step": 2665, "loss": 1.1043704748153687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.545952" }, { "step": 2666, "loss": 0.6816450357437134, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.662126" }, { "step": 2667, "loss": 0.6968179941177368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.763362" }, { "step": 2668, "loss": 1.0161278247833252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.848487" }, { "step": 2669, "loss": 0.9577001333236694, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:11.940010" }, { "step": 2670, "loss": 1.0913058519363403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.085733" }, { "step": 2671, "loss": 0.7297818660736084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.171148" }, { "step": 2672, "loss": 0.67213374376297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.272773" }, { "step": 2673, "loss": 0.48098504543304443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.360488" }, { "step": 2674, "loss": 0.9531916975975037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.453987" }, { "step": 2675, "loss": 0.7171496748924255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.545991" }, { "step": 2676, "loss": 0.7367916703224182, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.635910" }, { "step": 2677, "loss": 0.7872375249862671, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.728300" }, { "step": 2678, "loss": 0.8762933015823364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.821870" }, { "step": 2679, "loss": 0.6657413244247437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:12.936967" }, { "step": 2680, "loss": 0.6500644087791443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.023325" }, { "step": 2681, "loss": 0.614724338054657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.116334" }, { "step": 2682, "loss": 0.7034215927124023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.206741" }, { "step": 2683, "loss": 0.5032481551170349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.307980" }, { "step": 2684, "loss": 0.47474706172943115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.407248" }, { "step": 2685, "loss": 0.9131549596786499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.517237" }, { "step": 2686, "loss": 0.8668311834335327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.611767" }, { "step": 2687, "loss": 0.7085867524147034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.700024" }, { "step": 2688, "loss": 1.029914140701294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.811462" }, { "step": 2689, "loss": 0.9745534658432007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.896139" }, { "step": 2690, "loss": 0.48471909761428833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:13.993513" }, { "step": 2691, "loss": 0.8959150314331055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.079721" }, { "step": 2692, "loss": 0.7273302674293518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.180206" }, { "step": 2693, "loss": 0.6105005741119385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.265323" }, { "step": 2694, "loss": 0.9476595520973206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.378923" }, { "step": 2695, "loss": 0.8910791873931885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.469564" }, { "step": 2696, "loss": 0.6672957539558411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.560767" }, { "step": 2697, "loss": 0.9937787652015686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.672040" }, { "step": 2698, "loss": 0.48964864015579224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.772899" }, { "step": 2699, "loss": 0.7030453681945801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.871308" }, { "step": 2700, "loss": 0.46673762798309326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:14.963937" }, { "step": 2701, "loss": 0.4387911260128021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.048580" }, { "step": 2702, "loss": 0.8058011531829834, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.140029" }, { "step": 2703, "loss": 0.7079870104789734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.235757" }, { "step": 2704, "loss": 0.8024710416793823, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.318021" }, { "step": 2705, "loss": 0.47672683000564575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.410194" }, { "step": 2706, "loss": 0.8778222799301147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.519089" }, { "step": 2707, "loss": 0.652590274810791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.612524" }, { "step": 2708, "loss": 1.024023175239563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.719951" }, { "step": 2709, "loss": 1.006188988685608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.817316" }, { "step": 2710, "loss": 0.8633742332458496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.907733" }, { "step": 2711, "loss": 0.716429591178894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:15.995602" }, { "step": 2712, "loss": 0.6673677563667297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.082533" }, { "step": 2713, "loss": 0.5497224926948547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.165145" }, { "step": 2714, "loss": 0.5813795924186707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.253922" }, { "step": 2715, "loss": 0.6400980949401855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.340325" }, { "step": 2716, "loss": 0.6697051525115967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.425817" }, { "step": 2717, "loss": 0.806524395942688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.523299" }, { "step": 2718, "loss": 0.8512616157531738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.607819" }, { "step": 2719, "loss": 0.5049362778663635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.707115" }, { "step": 2720, "loss": 0.8332846164703369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.801200" }, { "step": 2721, "loss": 0.908505380153656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.887409" }, { "step": 2722, "loss": 1.0377247333526611, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:16.973486" }, { "step": 2723, "loss": 0.60942143201828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.062668" }, { "step": 2724, "loss": 0.6302022337913513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.147963" }, { "step": 2725, "loss": 0.444186806678772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.234945" }, { "step": 2726, "loss": 0.692409098148346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.329575" }, { "step": 2727, "loss": 0.9896422624588013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.446064" }, { "step": 2728, "loss": 0.584827184677124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.539854" }, { "step": 2729, "loss": 0.30976948142051697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.632247" }, { "step": 2730, "loss": 0.8681372404098511, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.717467" }, { "step": 2731, "loss": 0.9589040875434875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.811133" }, { "step": 2732, "loss": 0.5368110537528992, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.903288" }, { "step": 2733, "loss": 0.7482609152793884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:17.989361" }, { "step": 2734, "loss": 0.5359793305397034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.089063" }, { "step": 2735, "loss": 0.6181921362876892, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.198806" }, { "step": 2736, "loss": 1.2343846559524536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.283985" }, { "step": 2737, "loss": 0.8444353342056274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.395250" }, { "step": 2738, "loss": 0.4275621771812439, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.480532" }, { "step": 2739, "loss": 0.7001984119415283, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.565391" }, { "step": 2740, "loss": 0.8995749950408936, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.701152" }, { "step": 2741, "loss": 0.6074145436286926, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.787222" }, { "step": 2742, "loss": 0.5635940432548523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.879099" }, { "step": 2743, "loss": 0.980613112449646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:18.975096" }, { "step": 2744, "loss": 0.6281070709228516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.100724" }, { "step": 2745, "loss": 0.6499900221824646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.187431" }, { "step": 2746, "loss": 0.5830938816070557, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.275919" }, { "step": 2747, "loss": 0.6785446405410767, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.365951" }, { "step": 2748, "loss": 0.6968251466751099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.457517" }, { "step": 2749, "loss": 0.6434208750724792, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.546411" }, { "step": 2750, "loss": 0.6022109985351562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.661246" }, { "step": 2751, "loss": 1.293239951133728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.747968" }, { "step": 2752, "loss": 0.6060115098953247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.836235" }, { "step": 2753, "loss": 0.6781842112541199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:19.921204" }, { "step": 2754, "loss": 0.5476868748664856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.005807" }, { "step": 2755, "loss": 0.7023114562034607, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.099713" }, { "step": 2756, "loss": 0.36635273694992065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.187543" }, { "step": 2757, "loss": 0.6464948058128357, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.279458" }, { "step": 2758, "loss": 0.7703419923782349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.370179" }, { "step": 2759, "loss": 0.8035709857940674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.468480" }, { "step": 2760, "loss": 1.1070137023925781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.584395" }, { "step": 2761, "loss": 0.668282151222229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.677937" }, { "step": 2762, "loss": 0.9800070524215698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.811753" }, { "step": 2763, "loss": 0.7638179063796997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:20.898152" }, { "step": 2764, "loss": 0.9866782426834106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.012080" }, { "step": 2765, "loss": 0.6056482195854187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.102880" }, { "step": 2766, "loss": 0.6477876901626587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.191324" }, { "step": 2767, "loss": 0.8706508278846741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.286103" }, { "step": 2768, "loss": 0.6932101249694824, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.387525" }, { "step": 2769, "loss": 0.550776481628418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.477803" }, { "step": 2770, "loss": 0.5248023867607117, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.577145" }, { "step": 2771, "loss": 0.3951207399368286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.667810" }, { "step": 2772, "loss": 0.6851232647895813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.780690" }, { "step": 2773, "loss": 0.8017231225967407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.878254" }, { "step": 2774, "loss": 1.1121078729629517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:21.963349" }, { "step": 2775, "loss": 0.7815440893173218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.051393" }, { "step": 2776, "loss": 0.8747097849845886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.173049" }, { "step": 2777, "loss": 1.1350957155227661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.258847" }, { "step": 2778, "loss": 0.7207091450691223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.348466" }, { "step": 2779, "loss": 0.7272195816040039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.437767" }, { "step": 2780, "loss": 0.7450095415115356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.527600" }, { "step": 2781, "loss": 0.4850429892539978, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.613596" }, { "step": 2782, "loss": 0.6368022561073303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.700279" }, { "step": 2783, "loss": 0.37713754177093506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.795981" }, { "step": 2784, "loss": 0.5899025201797485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.899145" }, { "step": 2785, "loss": 0.7101075649261475, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:22.992119" }, { "step": 2786, "loss": 0.6599434614181519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.079592" }, { "step": 2787, "loss": 0.5038039684295654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.180477" }, { "step": 2788, "loss": 0.7852099537849426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.290993" }, { "step": 2789, "loss": 0.5598618984222412, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.534870" }, { "step": 2790, "loss": 0.647304356098175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.628942" }, { "step": 2791, "loss": 0.6341134309768677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.736932" }, { "step": 2792, "loss": 0.7261837720870972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.857244" }, { "step": 2793, "loss": 1.0244252681732178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:23.967737" }, { "step": 2794, "loss": 1.0827528238296509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.101678" }, { "step": 2795, "loss": 0.5935348272323608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.187863" }, { "step": 2796, "loss": 0.5269498825073242, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.277241" }, { "step": 2797, "loss": 0.5465542078018188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.362543" }, { "step": 2798, "loss": 0.8190668225288391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.471743" }, { "step": 2799, "loss": 1.0172092914581299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.583266" }, { "step": 2800, "loss": 0.8212244510650635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.669919" }, { "step": 2801, "loss": 0.9793691635131836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.756912" }, { "step": 2802, "loss": 1.013411283493042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:24.890209" }, { "step": 2803, "loss": 0.5329989790916443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.017158" }, { "step": 2804, "loss": 0.6140652298927307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.110290" }, { "step": 2805, "loss": 1.0228683948516846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.229608" }, { "step": 2806, "loss": 0.7052899599075317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.318247" }, { "step": 2807, "loss": 0.9413107633590698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.403966" }, { "step": 2808, "loss": 0.3923308253288269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.489812" }, { "step": 2809, "loss": 0.5293272733688354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.579106" }, { "step": 2810, "loss": 0.7353485822677612, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.688828" }, { "step": 2811, "loss": 0.4651417136192322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.781531" }, { "step": 2812, "loss": 0.7600867748260498, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:25.889949" }, { "step": 2813, "loss": 0.6944457292556763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.000058" }, { "step": 2814, "loss": 0.8244867920875549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.092214" }, { "step": 2815, "loss": 0.37728413939476013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.185122" }, { "step": 2816, "loss": 0.8854578137397766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.269640" }, { "step": 2817, "loss": 0.8826516270637512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.381987" }, { "step": 2818, "loss": 0.4425710439682007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.474631" }, { "step": 2819, "loss": 0.8548840284347534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.559758" }, { "step": 2820, "loss": 0.5470541715621948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.644554" }, { "step": 2821, "loss": 0.8537894487380981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.737131" }, { "step": 2822, "loss": 0.8548280000686646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.821633" }, { "step": 2823, "loss": 0.8310918807983398, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:26.935252" }, { "step": 2824, "loss": 1.0283664464950562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.020646" }, { "step": 2825, "loss": 0.7097023725509644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.117386" }, { "step": 2826, "loss": 0.7173565626144409, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.201798" }, { "step": 2827, "loss": 0.873572587966919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.289414" }, { "step": 2828, "loss": 0.3053259551525116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.374011" }, { "step": 2829, "loss": 0.7227718830108643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.462630" }, { "step": 2830, "loss": 0.8303301334381104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.557875" }, { "step": 2831, "loss": 0.6208672523498535, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.651056" }, { "step": 2832, "loss": 0.8526721000671387, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.770647" }, { "step": 2833, "loss": 0.9826372861862183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.862729" }, { "step": 2834, "loss": 0.4761836528778076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:27.959385" }, { "step": 2835, "loss": 0.7217572927474976, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.046139" }, { "step": 2836, "loss": 0.5714162588119507, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.134784" }, { "step": 2837, "loss": 0.7412357926368713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.224576" }, { "step": 2838, "loss": 0.5940268039703369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.317451" }, { "step": 2839, "loss": 0.4826018810272217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.405407" }, { "step": 2840, "loss": 0.7678412199020386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.523373" }, { "step": 2841, "loss": 0.6693271398544312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.642788" }, { "step": 2842, "loss": 0.8639765977859497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.732837" }, { "step": 2843, "loss": 0.9408427476882935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.843275" }, { "step": 2844, "loss": 0.8769316077232361, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:28.955857" }, { "step": 2845, "loss": 0.9287752509117126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.042800" }, { "step": 2846, "loss": 0.46223050355911255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.127960" }, { "step": 2847, "loss": 0.8006738424301147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.247067" }, { "step": 2848, "loss": 0.7442089915275574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.333349" }, { "step": 2849, "loss": 0.7644265294075012, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.439904" }, { "step": 2850, "loss": 1.0395195484161377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.552274" }, { "step": 2851, "loss": 0.8352357149124146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.636552" }, { "step": 2852, "loss": 1.0005425214767456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.747952" }, { "step": 2853, "loss": 0.2794264853000641, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.836180" }, { "step": 2854, "loss": 0.6637501120567322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:29.929527" }, { "step": 2855, "loss": 0.8784409761428833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.029144" }, { "step": 2856, "loss": 0.8390023708343506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.140061" }, { "step": 2857, "loss": 0.7867629528045654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.230623" }, { "step": 2858, "loss": 0.6287150382995605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.324137" }, { "step": 2859, "loss": 0.8170692920684814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.409407" }, { "step": 2860, "loss": 0.45576944947242737, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.497812" }, { "step": 2861, "loss": 0.6290186643600464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.583763" }, { "step": 2862, "loss": 1.082993507385254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.678024" }, { "step": 2863, "loss": 0.32357582449913025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.775973" }, { "step": 2864, "loss": 0.5530069470405579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.866769" }, { "step": 2865, "loss": 0.7470005750656128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:30.980177" }, { "step": 2866, "loss": 0.7053801417350769, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.070866" }, { "step": 2867, "loss": 0.5229827165603638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.156785" }, { "step": 2868, "loss": 0.7485517263412476, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.272196" }, { "step": 2869, "loss": 0.8482354879379272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.358328" }, { "step": 2870, "loss": 0.6771572828292847, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.444087" }, { "step": 2871, "loss": 0.762988269329071, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.537735" }, { "step": 2872, "loss": 0.8236910104751587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.622323" }, { "step": 2873, "loss": 0.7729521989822388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.716204" }, { "step": 2874, "loss": 0.7120711803436279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.828397" }, { "step": 2875, "loss": 0.661318302154541, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:31.918711" }, { "step": 2876, "loss": 0.4928077459335327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.003563" }, { "step": 2877, "loss": 1.0927553176879883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.105422" }, { "step": 2878, "loss": 0.45693790912628174, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.192276" }, { "step": 2879, "loss": 0.4572792053222656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.285354" }, { "step": 2880, "loss": 0.5472351312637329, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.382644" }, { "step": 2881, "loss": 0.7973991632461548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.501855" }, { "step": 2882, "loss": 0.5910221338272095, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.593342" }, { "step": 2883, "loss": 0.7294446229934692, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.680152" }, { "step": 2884, "loss": 0.8213886022567749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.770977" }, { "step": 2885, "loss": 0.8404065370559692, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.856204" }, { "step": 2886, "loss": 0.8550060987472534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:32.950590" }, { "step": 2887, "loss": 0.653713583946228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.039762" }, { "step": 2888, "loss": 0.6705575585365295, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.128988" }, { "step": 2889, "loss": 0.5619778633117676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.215185" }, { "step": 2890, "loss": 0.7579277753829956, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.301422" }, { "step": 2891, "loss": 0.7836620211601257, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.389470" }, { "step": 2892, "loss": 0.8120193481445312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.474736" }, { "step": 2893, "loss": 0.32617199420928955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.569752" }, { "step": 2894, "loss": 0.6052587032318115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.657444" }, { "step": 2895, "loss": 1.045852541923523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.750401" }, { "step": 2896, "loss": 0.9977197647094727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.835860" }, { "step": 2897, "loss": 0.9406428337097168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:33.979263" }, { "step": 2898, "loss": 0.6090332865715027, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.071328" }, { "step": 2899, "loss": 0.5991785526275635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.157600" }, { "step": 2900, "loss": 0.602517306804657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.244361" }, { "step": 2901, "loss": 0.8717185258865356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.328547" }, { "step": 2902, "loss": 0.5625187158584595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.425295" }, { "step": 2903, "loss": 1.0587315559387207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.517860" }, { "step": 2904, "loss": 0.8432915806770325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.602487" }, { "step": 2905, "loss": 0.9256998300552368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.695206" }, { "step": 2906, "loss": 0.6129046082496643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.805550" }, { "step": 2907, "loss": 1.0363798141479492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:34.912513" }, { "step": 2908, "loss": 0.7392028570175171, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.000192" }, { "step": 2909, "loss": 0.6355345249176025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.085811" }, { "step": 2910, "loss": 0.5123634338378906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.183223" }, { "step": 2911, "loss": 1.096540093421936, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.268773" }, { "step": 2912, "loss": 0.8125808238983154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.381698" }, { "step": 2913, "loss": 0.9197186231613159, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.491586" }, { "step": 2914, "loss": 0.6554942727088928, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.593073" }, { "step": 2915, "loss": 0.7221825122833252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.711504" }, { "step": 2916, "loss": 0.8921205997467041, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.852668" }, { "step": 2917, "loss": 0.9774461984634399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:35.964578" }, { "step": 2918, "loss": 0.9121456742286682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.050297" }, { "step": 2919, "loss": 0.8587324619293213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.170872" }, { "step": 2920, "loss": 0.6040313243865967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.264994" }, { "step": 2921, "loss": 0.42432165145874023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.357706" }, { "step": 2922, "loss": 1.0121948719024658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.486167" }, { "step": 2923, "loss": 0.7274143695831299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.580706" }, { "step": 2924, "loss": 0.3753930330276489, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.673076" }, { "step": 2925, "loss": 1.0722471475601196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.760433" }, { "step": 2926, "loss": 0.6751022338867188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.865837" }, { "step": 2927, "loss": 0.8744615316390991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:36.952614" }, { "step": 2928, "loss": 1.0123134851455688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.041199" }, { "step": 2929, "loss": 0.4335968494415283, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.129420" }, { "step": 2930, "loss": 0.6348329782485962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.216525" }, { "step": 2931, "loss": 1.162420630455017, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.305369" }, { "step": 2932, "loss": 0.6188063621520996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.390378" }, { "step": 2933, "loss": 0.9055655002593994, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.474730" }, { "step": 2934, "loss": 0.6871058940887451, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.597494" }, { "step": 2935, "loss": 0.8897973895072937, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.709492" }, { "step": 2936, "loss": 0.5880013704299927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.795224" }, { "step": 2937, "loss": 0.479616641998291, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:37.912770" }, { "step": 2938, "loss": 0.7683265209197998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.029397" }, { "step": 2939, "loss": 0.9999301433563232, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.144991" }, { "step": 2940, "loss": 0.744512677192688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.238489" }, { "step": 2941, "loss": 0.6929820775985718, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.324232" }, { "step": 2942, "loss": 0.636521577835083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.416852" }, { "step": 2943, "loss": 0.4294782876968384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.510502" }, { "step": 2944, "loss": 0.8073617219924927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.628647" }, { "step": 2945, "loss": 0.754601240158081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.714141" }, { "step": 2946, "loss": 0.7958248853683472, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.825563" }, { "step": 2947, "loss": 0.5025470852851868, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:38.923011" }, { "step": 2948, "loss": 0.9971753358840942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.017055" }, { "step": 2949, "loss": 0.7660197615623474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.107925" }, { "step": 2950, "loss": 0.6017042398452759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.192460" }, { "step": 2951, "loss": 0.5896728038787842, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.290876" }, { "step": 2952, "loss": 0.6781872510910034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.378216" }, { "step": 2953, "loss": 0.978561282157898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.521250" }, { "step": 2954, "loss": 0.7663436532020569, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.607484" }, { "step": 2955, "loss": 0.7339932918548584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.694244" }, { "step": 2956, "loss": 0.8805321455001831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.819570" }, { "step": 2957, "loss": 0.5551884174346924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:39.914497" }, { "step": 2958, "loss": 0.6848639249801636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.025418" }, { "step": 2959, "loss": 0.7219468355178833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.116537" }, { "step": 2960, "loss": 1.0961551666259766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.222251" }, { "step": 2961, "loss": 0.6448416113853455, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.307801" }, { "step": 2962, "loss": 0.9449483156204224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.394375" }, { "step": 2963, "loss": 0.7770485281944275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.483790" }, { "step": 2964, "loss": 0.6591987609863281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.581366" }, { "step": 2965, "loss": 0.7035844922065735, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.672138" }, { "step": 2966, "loss": 0.7948017716407776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.764962" }, { "step": 2967, "loss": 0.3833720088005066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.857000" }, { "step": 2968, "loss": 0.6763567328453064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:40.949750" }, { "step": 2969, "loss": 0.5635265111923218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.036960" }, { "step": 2970, "loss": 0.5668124556541443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.130776" }, { "step": 2971, "loss": 0.9717154502868652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.239423" }, { "step": 2972, "loss": 0.8395825028419495, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.332691" }, { "step": 2973, "loss": 0.35927852988243103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.420628" }, { "step": 2974, "loss": 0.8057406544685364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.537940" }, { "step": 2975, "loss": 0.8148016929626465, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.623782" }, { "step": 2976, "loss": 0.806751012802124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.719465" }, { "step": 2977, "loss": 0.7771547436714172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.808275" }, { "step": 2978, "loss": 0.6926621198654175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.899758" }, { "step": 2979, "loss": 0.8201907277107239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:41.986607" }, { "step": 2980, "loss": 0.41305050253868103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.073137" }, { "step": 2981, "loss": 0.5846246480941772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.173003" }, { "step": 2982, "loss": 0.5661888122558594, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.264986" }, { "step": 2983, "loss": 0.4795793294906616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.350332" }, { "step": 2984, "loss": 0.8065694570541382, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.445965" }, { "step": 2985, "loss": 0.5277481079101562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.530605" }, { "step": 2986, "loss": 0.5197981595993042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.624880" }, { "step": 2987, "loss": 0.8714021444320679, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.717850" }, { "step": 2988, "loss": 0.8044940233230591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.816101" }, { "step": 2989, "loss": 0.8242455720901489, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.908715" }, { "step": 2990, "loss": 0.576938271522522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:42.996068" }, { "step": 2991, "loss": 0.683268666267395, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.107052" }, { "step": 2992, "loss": 0.99819016456604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.210681" }, { "step": 2993, "loss": 0.6284622550010681, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.301523" }, { "step": 2994, "loss": 0.5702928304672241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.394184" }, { "step": 2995, "loss": 0.5061267018318176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.486108" }, { "step": 2996, "loss": 0.7529368996620178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.574003" }, { "step": 2997, "loss": 0.6810807585716248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.663695" }, { "step": 2998, "loss": 0.5909476280212402, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.759205" }, { "step": 2999, "loss": 0.6685561537742615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.852698" }, { "step": 3000, "loss": 0.9648053646087646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:29:43.943633" }, { "step": 3001, "loss": 0.9805135726928711, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:06.575498" }, { "step": 3002, "loss": 0.501151978969574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:06.671697" }, { "step": 3003, "loss": 0.9174951314926147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:06.773512" }, { "step": 3004, "loss": 0.5940431356430054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:06.889408" }, { "step": 3005, "loss": 0.839946985244751, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:06.976863" }, { "step": 3006, "loss": 0.8507363796234131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.068767" }, { "step": 3007, "loss": 0.9616976976394653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.153585" }, { "step": 3008, "loss": 0.8954578638076782, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.244669" }, { "step": 3009, "loss": 0.5576778650283813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.336760" }, { "step": 3010, "loss": 0.5665724873542786, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.429787" }, { "step": 3011, "loss": 0.6128925085067749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.529976" }, { "step": 3012, "loss": 0.6412845849990845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.617574" }, { "step": 3013, "loss": 0.7503130435943604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.703506" }, { "step": 3014, "loss": 1.1152994632720947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.790706" }, { "step": 3015, "loss": 0.9724318385124207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.883587" }, { "step": 3016, "loss": 0.4749130606651306, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:07.989831" }, { "step": 3017, "loss": 1.042256474494934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.082141" }, { "step": 3018, "loss": 0.7291653156280518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.174367" }, { "step": 3019, "loss": 0.9275494813919067, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.294327" }, { "step": 3020, "loss": 0.47083163261413574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.391297" }, { "step": 3021, "loss": 1.0753037929534912, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.528849" }, { "step": 3022, "loss": 0.7099695205688477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.646037" }, { "step": 3023, "loss": 0.8354144096374512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.791649" }, { "step": 3024, "loss": 1.0304509401321411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.889158" }, { "step": 3025, "loss": 0.6055278778076172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:08.982692" }, { "step": 3026, "loss": 0.6935775279998779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.107135" }, { "step": 3027, "loss": 0.7401977181434631, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.224449" }, { "step": 3028, "loss": 0.5569331645965576, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.308535" }, { "step": 3029, "loss": 1.5404268503189087, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.394464" }, { "step": 3030, "loss": 0.9184237718582153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.479941" }, { "step": 3031, "loss": 1.2896469831466675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.564218" }, { "step": 3032, "loss": 0.7349753975868225, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.650421" }, { "step": 3033, "loss": 0.400424063205719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.741223" }, { "step": 3034, "loss": 0.584333598613739, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.836061" }, { "step": 3035, "loss": 0.7202877998352051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:09.927207" }, { "step": 3036, "loss": 0.6643348932266235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.045590" }, { "step": 3037, "loss": 1.0133179426193237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.169351" }, { "step": 3038, "loss": 0.8102070689201355, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.281719" }, { "step": 3039, "loss": 0.7073261141777039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.399604" }, { "step": 3040, "loss": 0.8126324415206909, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.521730" }, { "step": 3041, "loss": 0.8746421337127686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.619656" }, { "step": 3042, "loss": 0.7138792872428894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.738518" }, { "step": 3043, "loss": 0.8544684052467346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.830022" }, { "step": 3044, "loss": 1.115713119506836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:10.939225" }, { "step": 3045, "loss": 0.9254186153411865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.050263" }, { "step": 3046, "loss": 0.7348741888999939, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.143048" }, { "step": 3047, "loss": 0.7529674768447876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.232150" }, { "step": 3048, "loss": 1.103926420211792, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.319555" }, { "step": 3049, "loss": 0.6438760757446289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.421098" }, { "step": 3050, "loss": 0.5635496973991394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.514116" }, { "step": 3051, "loss": 0.8631874322891235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.625602" }, { "step": 3052, "loss": 0.6754119396209717, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.725422" }, { "step": 3053, "loss": 0.6170694828033447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.819793" }, { "step": 3054, "loss": 0.7282772064208984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:11.911158" }, { "step": 3055, "loss": 1.261899709701538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.024953" }, { "step": 3056, "loss": 0.5550755262374878, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.115783" }, { "step": 3057, "loss": 0.7105146050453186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.204747" }, { "step": 3058, "loss": 0.7564438581466675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.291451" }, { "step": 3059, "loss": 0.8576802611351013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.376704" }, { "step": 3060, "loss": 0.4365670084953308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.469882" }, { "step": 3061, "loss": 0.6835899353027344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.565150" }, { "step": 3062, "loss": 0.6810494065284729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.659785" }, { "step": 3063, "loss": 0.7478222846984863, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.745678" }, { "step": 3064, "loss": 0.6957106590270996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.845381" }, { "step": 3065, "loss": 0.942913293838501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:12.959186" }, { "step": 3066, "loss": 0.45282405614852905, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.058657" }, { "step": 3067, "loss": 0.7769769430160522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.173251" }, { "step": 3068, "loss": 0.4644858241081238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.265311" }, { "step": 3069, "loss": 0.6380125880241394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.364310" }, { "step": 3070, "loss": 0.8456429243087769, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.480431" }, { "step": 3071, "loss": 0.7565112113952637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.567299" }, { "step": 3072, "loss": 0.42182108759880066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.653179" }, { "step": 3073, "loss": 0.4376131296157837, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.744905" }, { "step": 3074, "loss": 0.756783664226532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.861146" }, { "step": 3075, "loss": 0.9284956455230713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:13.971115" }, { "step": 3076, "loss": 0.6386061906814575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.063835" }, { "step": 3077, "loss": 0.6654310822486877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.156699" }, { "step": 3078, "loss": 0.6955143809318542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.251303" }, { "step": 3079, "loss": 0.5810842514038086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.343182" }, { "step": 3080, "loss": 0.8800133466720581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.435405" }, { "step": 3081, "loss": 0.3649836778640747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.521852" }, { "step": 3082, "loss": 0.9126920700073242, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.640603" }, { "step": 3083, "loss": 0.5018119215965271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.734760" }, { "step": 3084, "loss": 0.44410187005996704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.825566" }, { "step": 3085, "loss": 1.0078314542770386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:14.940105" }, { "step": 3086, "loss": 0.6567389369010925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.028181" }, { "step": 3087, "loss": 0.688673734664917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.128567" }, { "step": 3088, "loss": 0.5504109263420105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.220449" }, { "step": 3089, "loss": 0.7390774488449097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.329717" }, { "step": 3090, "loss": 0.7542642951011658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.423784" }, { "step": 3091, "loss": 0.6794458627700806, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.547629" }, { "step": 3092, "loss": 0.7504497170448303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.657886" }, { "step": 3093, "loss": 0.8983004093170166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.768574" }, { "step": 3094, "loss": 0.5185648202896118, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.853809" }, { "step": 3095, "loss": 0.7121344208717346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:15.942764" }, { "step": 3096, "loss": 0.741154134273529, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.027045" }, { "step": 3097, "loss": 0.8137518167495728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.121834" }, { "step": 3098, "loss": 0.862762987613678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.209421" }, { "step": 3099, "loss": 0.9524462223052979, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.321103" }, { "step": 3100, "loss": 0.7641392946243286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.406570" }, { "step": 3101, "loss": 0.8009275197982788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.522942" }, { "step": 3102, "loss": 0.9935872554779053, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.634438" }, { "step": 3103, "loss": 0.9685931205749512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.719481" }, { "step": 3104, "loss": 0.6979647874832153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.804902" }, { "step": 3105, "loss": 0.806624174118042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.899434" }, { "step": 3106, "loss": 0.7881092429161072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:16.991523" }, { "step": 3107, "loss": 0.7634115815162659, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.087067" }, { "step": 3108, "loss": 0.8897393345832825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.182432" }, { "step": 3109, "loss": 0.29650163650512695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.270894" }, { "step": 3110, "loss": 0.7727733254432678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.356829" }, { "step": 3111, "loss": 0.5910601615905762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.455512" }, { "step": 3112, "loss": 0.819779634475708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.559486" }, { "step": 3113, "loss": 0.7032309770584106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.669758" }, { "step": 3114, "loss": 0.840410053730011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.761489" }, { "step": 3115, "loss": 0.9125518798828125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.855848" }, { "step": 3116, "loss": 0.7666575312614441, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:17.969363" }, { "step": 3117, "loss": 0.5673443675041199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.053411" }, { "step": 3118, "loss": 0.4937063157558441, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.145555" }, { "step": 3119, "loss": 0.4939037561416626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.231353" }, { "step": 3120, "loss": 1.0518746376037598, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.326256" }, { "step": 3121, "loss": 0.9037171602249146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.412901" }, { "step": 3122, "loss": 0.6544389128684998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.497906" }, { "step": 3123, "loss": 0.8583559989929199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.589691" }, { "step": 3124, "loss": 0.9024344682693481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.675649" }, { "step": 3125, "loss": 0.8224021196365356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.765056" }, { "step": 3126, "loss": 0.9537413120269775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.853618" }, { "step": 3127, "loss": 0.8202701210975647, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:18.941683" }, { "step": 3128, "loss": 0.4655417799949646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.033336" }, { "step": 3129, "loss": 0.7449212670326233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.125000" }, { "step": 3130, "loss": 0.6462110877037048, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.209701" }, { "step": 3131, "loss": 0.6375960111618042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.299047" }, { "step": 3132, "loss": 0.7445585131645203, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.385575" }, { "step": 3133, "loss": 0.6389011144638062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.470245" }, { "step": 3134, "loss": 0.5230859518051147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.560112" }, { "step": 3135, "loss": 0.6139276623725891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.650095" }, { "step": 3136, "loss": 0.7262135744094849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.737464" }, { "step": 3137, "loss": 0.7788594961166382, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.828139" }, { "step": 3138, "loss": 0.7317264080047607, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:19.918370" }, { "step": 3139, "loss": 1.0542404651641846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.040128" }, { "step": 3140, "loss": 0.5679299831390381, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.144711" }, { "step": 3141, "loss": 0.6864079236984253, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.261550" }, { "step": 3142, "loss": 0.5572327971458435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.356140" }, { "step": 3143, "loss": 0.8730728626251221, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.472279" }, { "step": 3144, "loss": 0.5637379884719849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.569132" }, { "step": 3145, "loss": 0.7062610983848572, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.667745" }, { "step": 3146, "loss": 0.42234450578689575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.759980" }, { "step": 3147, "loss": 0.5159710049629211, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.852523" }, { "step": 3148, "loss": 1.1041570901870728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:20.943856" }, { "step": 3149, "loss": 0.6372393369674683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.045466" }, { "step": 3150, "loss": 1.1083418130874634, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.141258" }, { "step": 3151, "loss": 0.9783831834793091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.228370" }, { "step": 3152, "loss": 0.6280320882797241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.330312" }, { "step": 3153, "loss": 0.8681676387786865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.419278" }, { "step": 3154, "loss": 0.6604915261268616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.511954" }, { "step": 3155, "loss": 0.5028591156005859, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.601617" }, { "step": 3156, "loss": 0.6180320978164673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.718782" }, { "step": 3157, "loss": 0.8087215423583984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.809005" }, { "step": 3158, "loss": 0.6777383089065552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:21.930882" }, { "step": 3159, "loss": 0.7281546592712402, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.019490" }, { "step": 3160, "loss": 0.6736454963684082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.111296" }, { "step": 3161, "loss": 0.9830069541931152, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.195993" }, { "step": 3162, "loss": 0.5862903594970703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.313262" }, { "step": 3163, "loss": 0.40392306447029114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.398826" }, { "step": 3164, "loss": 0.6801989078521729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.517031" }, { "step": 3165, "loss": 0.7722682952880859, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.630258" }, { "step": 3166, "loss": 0.36972135305404663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.726221" }, { "step": 3167, "loss": 0.9538811445236206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.808933" }, { "step": 3168, "loss": 0.8485324382781982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.901950" }, { "step": 3169, "loss": 0.5764671564102173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:22.994876" }, { "step": 3170, "loss": 1.0854945182800293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.081821" }, { "step": 3171, "loss": 1.0815273523330688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.172252" }, { "step": 3172, "loss": 0.6788411736488342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.258894" }, { "step": 3173, "loss": 1.0269510746002197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.366161" }, { "step": 3174, "loss": 0.8620308041572571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.459375" }, { "step": 3175, "loss": 0.7269145250320435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.549099" }, { "step": 3176, "loss": 0.6917524337768555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.648976" }, { "step": 3177, "loss": 0.792110800743103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.733946" }, { "step": 3178, "loss": 0.8119210004806519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.840291" }, { "step": 3179, "loss": 0.941260576248169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:23.925416" }, { "step": 3180, "loss": 0.7359766364097595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.010408" }, { "step": 3181, "loss": 0.5123286247253418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.106004" }, { "step": 3182, "loss": 0.8364824056625366, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.198314" }, { "step": 3183, "loss": 0.8368743658065796, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.293072" }, { "step": 3184, "loss": 0.7790253162384033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.405817" }, { "step": 3185, "loss": 0.7074493169784546, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.495904" }, { "step": 3186, "loss": 0.4472644031047821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.590270" }, { "step": 3187, "loss": 0.6493406891822815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.687133" }, { "step": 3188, "loss": 0.6939192414283752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.772426" }, { "step": 3189, "loss": 0.6530179977416992, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.857965" }, { "step": 3190, "loss": 1.0823748111724854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:24.974686" }, { "step": 3191, "loss": 0.6571548581123352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.062327" }, { "step": 3192, "loss": 0.7007577419281006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.149114" }, { "step": 3193, "loss": 0.7868717908859253, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.257862" }, { "step": 3194, "loss": 0.6737204790115356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.345711" }, { "step": 3195, "loss": 0.7109578251838684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.443347" }, { "step": 3196, "loss": 0.44007110595703125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.535352" }, { "step": 3197, "loss": 0.9133606553077698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.623276" }, { "step": 3198, "loss": 0.9143474102020264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.709348" }, { "step": 3199, "loss": 0.5409735441207886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.802184" }, { "step": 3200, "loss": 0.5694776177406311, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:25.930207" }, { "step": 3201, "loss": 0.5412457585334778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.017007" }, { "step": 3202, "loss": 0.8244484066963196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.101239" }, { "step": 3203, "loss": 0.7138899564743042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.187135" }, { "step": 3204, "loss": 0.5174521803855896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.279625" }, { "step": 3205, "loss": 1.0250258445739746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.389678" }, { "step": 3206, "loss": 0.9231112003326416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.473525" }, { "step": 3207, "loss": 0.4580802023410797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.563472" }, { "step": 3208, "loss": 0.706415057182312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.654809" }, { "step": 3209, "loss": 0.9045460224151611, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.744255" }, { "step": 3210, "loss": 0.39070925116539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.843699" }, { "step": 3211, "loss": 0.8224180936813354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:26.948790" }, { "step": 3212, "loss": 0.6694439053535461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.037872" }, { "step": 3213, "loss": 0.3985706567764282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.130856" }, { "step": 3214, "loss": 0.5749392509460449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.234415" }, { "step": 3215, "loss": 0.6819666028022766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.352406" }, { "step": 3216, "loss": 0.9452817440032959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.473339" }, { "step": 3217, "loss": 0.8062852621078491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.564877" }, { "step": 3218, "loss": 0.45746028423309326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.653498" }, { "step": 3219, "loss": 0.6794825792312622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.738174" }, { "step": 3220, "loss": 0.6394520998001099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.830488" }, { "step": 3221, "loss": 0.9610781669616699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:27.949627" }, { "step": 3222, "loss": 0.7870481014251709, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.044136" }, { "step": 3223, "loss": 0.6023524403572083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.129475" }, { "step": 3224, "loss": 0.679192304611206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.239357" }, { "step": 3225, "loss": 0.7376857995986938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.333084" }, { "step": 3226, "loss": 0.4379594326019287, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.426629" }, { "step": 3227, "loss": 0.8599427938461304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.519801" }, { "step": 3228, "loss": 0.7263824939727783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.613501" }, { "step": 3229, "loss": 0.7730405926704407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.704802" }, { "step": 3230, "loss": 0.9265391230583191, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.817564" }, { "step": 3231, "loss": 0.8509201407432556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.902570" }, { "step": 3232, "loss": 0.9844202995300293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:28.988183" }, { "step": 3233, "loss": 0.8701931238174438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.072853" }, { "step": 3234, "loss": 0.7149703502655029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.189748" }, { "step": 3235, "loss": 0.7420458793640137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.280890" }, { "step": 3236, "loss": 0.5729456543922424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.378938" }, { "step": 3237, "loss": 0.47160804271698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.463876" }, { "step": 3238, "loss": 0.44341057538986206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.552040" }, { "step": 3239, "loss": 0.8949050903320312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.661891" }, { "step": 3240, "loss": 1.1488797664642334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.758370" }, { "step": 3241, "loss": 0.6367141604423523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.848992" }, { "step": 3242, "loss": 0.9476053714752197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:29.959026" }, { "step": 3243, "loss": 1.0429589748382568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.045545" }, { "step": 3244, "loss": 0.7084981203079224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.168858" }, { "step": 3245, "loss": 0.8637794256210327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.261180" }, { "step": 3246, "loss": 0.39634618163108826, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.354096" }, { "step": 3247, "loss": 0.5115682482719421, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.443564" }, { "step": 3248, "loss": 0.9106144905090332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.530434" }, { "step": 3249, "loss": 0.7793893218040466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.657137" }, { "step": 3250, "loss": 0.8147534132003784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.753419" }, { "step": 3251, "loss": 0.9374070167541504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.863877" }, { "step": 3252, "loss": 0.565058171749115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:30.956659" }, { "step": 3253, "loss": 0.5448878407478333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.049587" }, { "step": 3254, "loss": 0.7819275856018066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.141364" }, { "step": 3255, "loss": 1.1723284721374512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.230721" }, { "step": 3256, "loss": 0.9482029676437378, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.382054" }, { "step": 3257, "loss": 0.8097343444824219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.469457" }, { "step": 3258, "loss": 0.9912012815475464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.578387" }, { "step": 3259, "loss": 1.013709306716919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.664898" }, { "step": 3260, "loss": 0.6878746151924133, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.754484" }, { "step": 3261, "loss": 0.659705400466919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.838651" }, { "step": 3262, "loss": 0.7861377000808716, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:31.956687" }, { "step": 3263, "loss": 0.3514382541179657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.051562" }, { "step": 3264, "loss": 0.7164840698242188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.142836" }, { "step": 3265, "loss": 0.7585687041282654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.257208" }, { "step": 3266, "loss": 0.93060702085495, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.347053" }, { "step": 3267, "loss": 0.6551715135574341, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.440819" }, { "step": 3268, "loss": 0.8253731727600098, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.557326" }, { "step": 3269, "loss": 0.8118700981140137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.648116" }, { "step": 3270, "loss": 0.7092741131782532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.737072" }, { "step": 3271, "loss": 0.8516911268234253, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.824885" }, { "step": 3272, "loss": 1.0336393117904663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:32.931784" }, { "step": 3273, "loss": 0.5220339298248291, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.023234" }, { "step": 3274, "loss": 0.6169244050979614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.112601" }, { "step": 3275, "loss": 0.5392110347747803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.198387" }, { "step": 3276, "loss": 1.1895697116851807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.284973" }, { "step": 3277, "loss": 0.8159258365631104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.372941" }, { "step": 3278, "loss": 0.9245014190673828, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.457285" }, { "step": 3279, "loss": 0.8026454448699951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.549363" }, { "step": 3280, "loss": 0.45132380723953247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.641673" }, { "step": 3281, "loss": 0.5423135161399841, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.734978" }, { "step": 3282, "loss": 0.6178992986679077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.850759" }, { "step": 3283, "loss": 0.5004984736442566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:33.940477" }, { "step": 3284, "loss": 0.8610962629318237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.059401" }, { "step": 3285, "loss": 0.705467700958252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.150520" }, { "step": 3286, "loss": 0.8266055583953857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.258757" }, { "step": 3287, "loss": 0.6286271214485168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.343609" }, { "step": 3288, "loss": 0.7417175769805908, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.431414" }, { "step": 3289, "loss": 0.9366861581802368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.525693" }, { "step": 3290, "loss": 0.6631477475166321, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.649960" }, { "step": 3291, "loss": 0.8264108896255493, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.742275" }, { "step": 3292, "loss": 0.49946141242980957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.827921" }, { "step": 3293, "loss": 0.8233369588851929, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:34.928823" }, { "step": 3294, "loss": 0.811164379119873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.019209" }, { "step": 3295, "loss": 0.9874475598335266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.104376" }, { "step": 3296, "loss": 0.795071542263031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.192337" }, { "step": 3297, "loss": 0.5120899677276611, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.277423" }, { "step": 3298, "loss": 0.4160255789756775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.367871" }, { "step": 3299, "loss": 0.6404533982276917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.453027" }, { "step": 3300, "loss": 0.9878014326095581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.549068" }, { "step": 3301, "loss": 0.467906653881073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.647708" }, { "step": 3302, "loss": 0.9505558013916016, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.735342" }, { "step": 3303, "loss": 0.5349616408348083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.824932" }, { "step": 3304, "loss": 0.8259149789810181, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:35.935094" }, { "step": 3305, "loss": 0.876760721206665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.020054" }, { "step": 3306, "loss": 0.6104738712310791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.115148" }, { "step": 3307, "loss": 0.8237457275390625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.200609" }, { "step": 3308, "loss": 0.8434017896652222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.293119" }, { "step": 3309, "loss": 0.8109836578369141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.378304" }, { "step": 3310, "loss": 0.6026668548583984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.466637" }, { "step": 3311, "loss": 0.6385618448257446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.556442" }, { "step": 3312, "loss": 0.8602007627487183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.662351" }, { "step": 3313, "loss": 0.6122464537620544, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.748206" }, { "step": 3314, "loss": 0.4577614665031433, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.835547" }, { "step": 3315, "loss": 0.5747810006141663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:36.921150" }, { "step": 3316, "loss": 0.8799399137496948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.030247" }, { "step": 3317, "loss": 0.6983466744422913, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.120265" }, { "step": 3318, "loss": 0.831936240196228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.205622" }, { "step": 3319, "loss": 0.45395463705062866, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.295934" }, { "step": 3320, "loss": 0.7425445914268494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.382508" }, { "step": 3321, "loss": 0.7475301027297974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.481808" }, { "step": 3322, "loss": 0.5225805640220642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.567838" }, { "step": 3323, "loss": 0.8752028942108154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.657123" }, { "step": 3324, "loss": 0.5792776942253113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.743198" }, { "step": 3325, "loss": 1.0326966047286987, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.829727" }, { "step": 3326, "loss": 0.7152256369590759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:37.951078" }, { "step": 3327, "loss": 0.4295559823513031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.035945" }, { "step": 3328, "loss": 0.4275209903717041, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.121898" }, { "step": 3329, "loss": 0.6933001279830933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.232910" }, { "step": 3330, "loss": 0.5650151371955872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.318201" }, { "step": 3331, "loss": 0.5935956835746765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.421865" }, { "step": 3332, "loss": 0.5269439816474915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.512322" }, { "step": 3333, "loss": 0.5335818529129028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.607350" }, { "step": 3334, "loss": 0.9066001176834106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.692000" }, { "step": 3335, "loss": 0.7437013387680054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.811433" }, { "step": 3336, "loss": 0.5018743872642517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:38.917908" }, { "step": 3337, "loss": 1.2715797424316406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.035664" }, { "step": 3338, "loss": 0.7444844245910645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.150849" }, { "step": 3339, "loss": 1.009781002998352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.266839" }, { "step": 3340, "loss": 1.0889286994934082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.354976" }, { "step": 3341, "loss": 1.189896583557129, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.462558" }, { "step": 3342, "loss": 0.681369423866272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.550748" }, { "step": 3343, "loss": 0.8867378234863281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.636083" }, { "step": 3344, "loss": 0.5701128840446472, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.731319" }, { "step": 3345, "loss": 0.7483645081520081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.824550" }, { "step": 3346, "loss": 0.6193416118621826, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.912118" }, { "step": 3347, "loss": 0.797339916229248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:39.998383" }, { "step": 3348, "loss": 0.9155876636505127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.084527" }, { "step": 3349, "loss": 0.3824477195739746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.170712" }, { "step": 3350, "loss": 0.7221134901046753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.265792" }, { "step": 3351, "loss": 0.7902415990829468, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.377125" }, { "step": 3352, "loss": 0.4860917925834656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.470039" }, { "step": 3353, "loss": 0.944553017616272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.562080" }, { "step": 3354, "loss": 0.8704984188079834, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.681093" }, { "step": 3355, "loss": 0.8614016771316528, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.793327" }, { "step": 3356, "loss": 0.7257476449012756, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.885264" }, { "step": 3357, "loss": 0.7167946100234985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:40.995689" }, { "step": 3358, "loss": 0.7995426058769226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.085037" }, { "step": 3359, "loss": 0.8083840608596802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.170888" }, { "step": 3360, "loss": 0.763662576675415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.278693" }, { "step": 3361, "loss": 0.6566978693008423, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.365248" }, { "step": 3362, "loss": 0.6720725893974304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.459184" }, { "step": 3363, "loss": 0.7387163639068604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.545511" }, { "step": 3364, "loss": 0.858155369758606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.633720" }, { "step": 3365, "loss": 0.7551475167274475, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.755479" }, { "step": 3366, "loss": 0.3907164931297302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.845860" }, { "step": 3367, "loss": 0.7711496353149414, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:41.946316" }, { "step": 3368, "loss": 0.3771726191043854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.031343" }, { "step": 3369, "loss": 0.8176953792572021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.151950" }, { "step": 3370, "loss": 0.5747708082199097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.243799" }, { "step": 3371, "loss": 0.9786981344223022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.358203" }, { "step": 3372, "loss": 0.5959408283233643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.465629" }, { "step": 3373, "loss": 0.44812673330307007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.560930" }, { "step": 3374, "loss": 0.6525132060050964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.674195" }, { "step": 3375, "loss": 0.6794662475585938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.759875" }, { "step": 3376, "loss": 0.8298093676567078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.850458" }, { "step": 3377, "loss": 0.7810841798782349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:42.965862" }, { "step": 3378, "loss": 0.6052488088607788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.057882" }, { "step": 3379, "loss": 0.8497422933578491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.159036" }, { "step": 3380, "loss": 0.5143412351608276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.250133" }, { "step": 3381, "loss": 0.7647193670272827, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.334962" }, { "step": 3382, "loss": 0.44683194160461426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.432588" }, { "step": 3383, "loss": 0.698976993560791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.523659" }, { "step": 3384, "loss": 0.7907758951187134, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.631816" }, { "step": 3385, "loss": 0.6356850862503052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.750267" }, { "step": 3386, "loss": 0.6207312345504761, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.835064" }, { "step": 3387, "loss": 0.7772262692451477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:43.942842" }, { "step": 3388, "loss": 0.6971580982208252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.059518" }, { "step": 3389, "loss": 0.529020369052887, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.154878" }, { "step": 3390, "loss": 0.4354517161846161, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.248673" }, { "step": 3391, "loss": 0.7470306158065796, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.340965" }, { "step": 3392, "loss": 0.570461630821228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.435712" }, { "step": 3393, "loss": 0.5926608443260193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.520120" }, { "step": 3394, "loss": 0.6391808390617371, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.613944" }, { "step": 3395, "loss": 0.8208524584770203, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.700458" }, { "step": 3396, "loss": 0.6877185702323914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.793689" }, { "step": 3397, "loss": 0.9924322366714478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.906651" }, { "step": 3398, "loss": 0.9547948837280273, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:44.993314" }, { "step": 3399, "loss": 1.0328933000564575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.088165" }, { "step": 3400, "loss": 1.149420976638794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.176004" }, { "step": 3401, "loss": 0.8392502069473267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.268089" }, { "step": 3402, "loss": 0.7767413854598999, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.374996" }, { "step": 3403, "loss": 0.4352242052555084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.460557" }, { "step": 3404, "loss": 0.7701349854469299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.547307" }, { "step": 3405, "loss": 0.4520123600959778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.632776" }, { "step": 3406, "loss": 1.0020418167114258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.720539" }, { "step": 3407, "loss": 0.8010259866714478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.834447" }, { "step": 3408, "loss": 0.6659966707229614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:45.920562" }, { "step": 3409, "loss": 0.4351460933685303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.011351" }, { "step": 3410, "loss": 0.7746903896331787, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.119716" }, { "step": 3411, "loss": 0.6605627536773682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.219530" }, { "step": 3412, "loss": 0.4825456738471985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.313495" }, { "step": 3413, "loss": 0.9220658540725708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.399199" }, { "step": 3414, "loss": 0.7557275891304016, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.489012" }, { "step": 3415, "loss": 0.828728437423706, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.576491" }, { "step": 3416, "loss": 0.559532642364502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.669107" }, { "step": 3417, "loss": 1.0110080242156982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.786028" }, { "step": 3418, "loss": 0.7193533182144165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.878025" }, { "step": 3419, "loss": 0.8213282823562622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:46.978447" }, { "step": 3420, "loss": 0.5489025712013245, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.063062" }, { "step": 3421, "loss": 0.9064726829528809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.174294" }, { "step": 3422, "loss": 0.7447773218154907, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.272568" }, { "step": 3423, "loss": 1.0442607402801514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.366983" }, { "step": 3424, "loss": 0.704194962978363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.452139" }, { "step": 3425, "loss": 0.6755774021148682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.567266" }, { "step": 3426, "loss": 0.9681968092918396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.686622" }, { "step": 3427, "loss": 0.8948537111282349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.772520" }, { "step": 3428, "loss": 0.653038740158081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.884364" }, { "step": 3429, "loss": 0.44834789633750916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:47.970852" }, { "step": 3430, "loss": 0.7989956736564636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.056302" }, { "step": 3431, "loss": 0.6193897724151611, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.141704" }, { "step": 3432, "loss": 0.5457963943481445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.232298" }, { "step": 3433, "loss": 0.5163199305534363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.325377" }, { "step": 3434, "loss": 0.8119064569473267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.419973" }, { "step": 3435, "loss": 0.6751782894134521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.528886" }, { "step": 3436, "loss": 1.05290687084198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.622013" }, { "step": 3437, "loss": 0.7577234506607056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.715861" }, { "step": 3438, "loss": 0.9602457284927368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.804246" }, { "step": 3439, "loss": 0.8241970539093018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:48.894684" }, { "step": 3440, "loss": 0.7511780261993408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.012363" }, { "step": 3441, "loss": 0.22324907779693604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.097931" }, { "step": 3442, "loss": 1.1614620685577393, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.185241" }, { "step": 3443, "loss": 0.6445930004119873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.278030" }, { "step": 3444, "loss": 0.7855455875396729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.382222" }, { "step": 3445, "loss": 0.5877750515937805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.470080" }, { "step": 3446, "loss": 0.40608611702919006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.558199" }, { "step": 3447, "loss": 0.7691845297813416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.652159" }, { "step": 3448, "loss": 0.82719886302948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.745380" }, { "step": 3449, "loss": 0.5825662612915039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.841000" }, { "step": 3450, "loss": 0.678838849067688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:49.927323" }, { "step": 3451, "loss": 0.8377180695533752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.040417" }, { "step": 3452, "loss": 0.5939214825630188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.144638" }, { "step": 3453, "loss": 0.7258152961730957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.232919" }, { "step": 3454, "loss": 0.8305908441543579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.318468" }, { "step": 3455, "loss": 0.4878830313682556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.403571" }, { "step": 3456, "loss": 0.6539267897605896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.502768" }, { "step": 3457, "loss": 0.6119465231895447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.612831" }, { "step": 3458, "loss": 1.0077780485153198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.700488" }, { "step": 3459, "loss": 0.4255276918411255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.792600" }, { "step": 3460, "loss": 0.323469340801239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:50.891534" }, { "step": 3461, "loss": 0.9350086450576782, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.012788" }, { "step": 3462, "loss": 0.9594261646270752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.151950" }, { "step": 3463, "loss": 0.9098608493804932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.269255" }, { "step": 3464, "loss": 0.6238703727722168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.353640" }, { "step": 3465, "loss": 0.36003378033638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.438968" }, { "step": 3466, "loss": 0.5823748111724854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.526919" }, { "step": 3467, "loss": 0.4261472225189209, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.620919" }, { "step": 3468, "loss": 0.548007607460022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.710865" }, { "step": 3469, "loss": 0.507819652557373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.807520" }, { "step": 3470, "loss": 0.9762433767318726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:51.917021" }, { "step": 3471, "loss": 0.9304478168487549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.011554" }, { "step": 3472, "loss": 0.9657114744186401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.096742" }, { "step": 3473, "loss": 0.5974757671356201, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.188391" }, { "step": 3474, "loss": 0.6591046452522278, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.297466" }, { "step": 3475, "loss": 0.7011233568191528, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.391845" }, { "step": 3476, "loss": 0.8830780982971191, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.513887" }, { "step": 3477, "loss": 0.9530991315841675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.619310" }, { "step": 3478, "loss": 0.7117260694503784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.705498" }, { "step": 3479, "loss": 0.6708883047103882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.789222" }, { "step": 3480, "loss": 0.7273404002189636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.880462" }, { "step": 3481, "loss": 0.6627192497253418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:52.971649" }, { "step": 3482, "loss": 0.6759431958198547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.060738" }, { "step": 3483, "loss": 1.265660047531128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.181735" }, { "step": 3484, "loss": 0.9033564329147339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.267051" }, { "step": 3485, "loss": 0.5786389112472534, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.353320" }, { "step": 3486, "loss": 0.8743953704833984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.460880" }, { "step": 3487, "loss": 0.6894832253456116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.556676" }, { "step": 3488, "loss": 0.8744434118270874, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.669706" }, { "step": 3489, "loss": 0.5806879997253418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.764426" }, { "step": 3490, "loss": 0.7757110595703125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.848946" }, { "step": 3491, "loss": 0.8099993467330933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:53.935884" }, { "step": 3492, "loss": 1.0209382772445679, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.037339" }, { "step": 3493, "loss": 0.7540505528450012, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.129144" }, { "step": 3494, "loss": 0.8701831102371216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.221008" }, { "step": 3495, "loss": 0.7802522778511047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.305919" }, { "step": 3496, "loss": 0.6256201267242432, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.399471" }, { "step": 3497, "loss": 0.6731424927711487, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.495212" }, { "step": 3498, "loss": 0.3049931526184082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.581041" }, { "step": 3499, "loss": 0.7152966856956482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.667263" }, { "step": 3500, "loss": 0.7844251394271851, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:30:54.774799" }, { "step": 3501, "loss": 0.9832898378372192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:17.639949" }, { "step": 3502, "loss": 0.9729974865913391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:17.755464" }, { "step": 3503, "loss": 0.7991012930870056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:17.855775" }, { "step": 3504, "loss": 0.8398756980895996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:17.968254" }, { "step": 3505, "loss": 0.52554851770401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.061478" }, { "step": 3506, "loss": 0.4474533796310425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.148331" }, { "step": 3507, "loss": 0.4570484757423401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.241191" }, { "step": 3508, "loss": 0.4929822087287903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.325897" }, { "step": 3509, "loss": 0.54095059633255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.413450" }, { "step": 3510, "loss": 1.1051408052444458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.527770" }, { "step": 3511, "loss": 0.7205290794372559, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.639526" }, { "step": 3512, "loss": 0.4946908950805664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.725639" }, { "step": 3513, "loss": 0.5748703479766846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.814645" }, { "step": 3514, "loss": 0.535889744758606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:18.907760" }, { "step": 3515, "loss": 0.779205858707428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.028099" }, { "step": 3516, "loss": 0.9895452260971069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.134823" }, { "step": 3517, "loss": 0.6768277883529663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.223517" }, { "step": 3518, "loss": 0.601672351360321, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.309361" }, { "step": 3519, "loss": 0.5467623472213745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.403490" }, { "step": 3520, "loss": 0.5625637769699097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.497092" }, { "step": 3521, "loss": 0.5397733449935913, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.589120" }, { "step": 3522, "loss": 0.9190055131912231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.683518" }, { "step": 3523, "loss": 0.9532109498977661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.777763" }, { "step": 3524, "loss": 1.1730554103851318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.892439" }, { "step": 3525, "loss": 0.5637879371643066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:19.984738" }, { "step": 3526, "loss": 0.4095139503479004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.076623" }, { "step": 3527, "loss": 0.5177748799324036, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.159294" }, { "step": 3528, "loss": 0.6642892360687256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.247900" }, { "step": 3529, "loss": 0.8354084491729736, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.366649" }, { "step": 3530, "loss": 0.4918149709701538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.455482" }, { "step": 3531, "loss": 0.7736240029335022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.544225" }, { "step": 3532, "loss": 0.5928648710250854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.629895" }, { "step": 3533, "loss": 0.7837066650390625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.716674" }, { "step": 3534, "loss": 0.8714853525161743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.807471" }, { "step": 3535, "loss": 0.7670563459396362, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:20.900857" }, { "step": 3536, "loss": 1.1406360864639282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.013445" }, { "step": 3537, "loss": 0.7800382375717163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.135426" }, { "step": 3538, "loss": 0.689795970916748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.227503" }, { "step": 3539, "loss": 1.05343496799469, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.342779" }, { "step": 3540, "loss": 0.9207431077957153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.453392" }, { "step": 3541, "loss": 1.0432119369506836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.540529" }, { "step": 3542, "loss": 0.7482895851135254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.666211" }, { "step": 3543, "loss": 0.9921121001243591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.756236" }, { "step": 3544, "loss": 1.146081805229187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.870423" }, { "step": 3545, "loss": 0.5389232039451599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:21.969905" }, { "step": 3546, "loss": 0.9371793270111084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.057935" }, { "step": 3547, "loss": 1.0200493335723877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.169264" }, { "step": 3548, "loss": 0.5338776707649231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.261291" }, { "step": 3549, "loss": 0.5657249689102173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.348230" }, { "step": 3550, "loss": 0.5648197531700134, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.432930" }, { "step": 3551, "loss": 0.4725416898727417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.519038" }, { "step": 3552, "loss": 0.6069210767745972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.607093" }, { "step": 3553, "loss": 0.5097184181213379, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.724082" }, { "step": 3554, "loss": 0.5466295480728149, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.819414" }, { "step": 3555, "loss": 0.9454019069671631, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.904707" }, { "step": 3556, "loss": 0.9076260328292847, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:22.999330" }, { "step": 3557, "loss": 0.5618622899055481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.083959" }, { "step": 3558, "loss": 0.9696615934371948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.193332" }, { "step": 3559, "loss": 0.4915342330932617, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.289942" }, { "step": 3560, "loss": 0.7397376894950867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.382543" }, { "step": 3561, "loss": 0.6493360996246338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.474581" }, { "step": 3562, "loss": 0.9390573501586914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.593351" }, { "step": 3563, "loss": 0.46062153577804565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.687269" }, { "step": 3564, "loss": 0.881056010723114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.825674" }, { "step": 3565, "loss": 0.47002172470092773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:23.922164" }, { "step": 3566, "loss": 0.8659512400627136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.012348" }, { "step": 3567, "loss": 0.8974915742874146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.105603" }, { "step": 3568, "loss": 0.6876376271247864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.200005" }, { "step": 3569, "loss": 0.8824435472488403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.284171" }, { "step": 3570, "loss": 0.923683226108551, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.397115" }, { "step": 3571, "loss": 1.074220895767212, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.486850" }, { "step": 3572, "loss": 0.6896129846572876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.605498" }, { "step": 3573, "loss": 0.6262019872665405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.698441" }, { "step": 3574, "loss": 0.9730312824249268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.809255" }, { "step": 3575, "loss": 0.6120641827583313, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.902412" }, { "step": 3576, "loss": 0.48997440934181213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:24.995000" }, { "step": 3577, "loss": 0.7177724242210388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.080072" }, { "step": 3578, "loss": 0.4814273416996002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.169322" }, { "step": 3579, "loss": 0.5457921624183655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.258788" }, { "step": 3580, "loss": 0.7539310455322266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.360836" }, { "step": 3581, "loss": 0.6182910799980164, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.476226" }, { "step": 3582, "loss": 0.8037958741188049, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.562532" }, { "step": 3583, "loss": 0.8304908871650696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.647305" }, { "step": 3584, "loss": 0.7186700701713562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.733825" }, { "step": 3585, "loss": 0.7250931262969971, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.819038" }, { "step": 3586, "loss": 0.5332584381103516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:25.917831" }, { "step": 3587, "loss": 0.42800986766815186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.003692" }, { "step": 3588, "loss": 0.6573816537857056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.090737" }, { "step": 3589, "loss": 0.705070972442627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.201311" }, { "step": 3590, "loss": 0.6982009410858154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.294969" }, { "step": 3591, "loss": 0.9949502944946289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.401594" }, { "step": 3592, "loss": 1.0603227615356445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.491013" }, { "step": 3593, "loss": 0.7429453730583191, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.578627" }, { "step": 3594, "loss": 0.5903918743133545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.672964" }, { "step": 3595, "loss": 0.45461779832839966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.766720" }, { "step": 3596, "loss": 0.44448450207710266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.854804" }, { "step": 3597, "loss": 0.3757067918777466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:26.947134" }, { "step": 3598, "loss": 1.0282156467437744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.035044" }, { "step": 3599, "loss": 0.7234094738960266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.131928" }, { "step": 3600, "loss": 0.7314268350601196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.252256" }, { "step": 3601, "loss": 0.7107868790626526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.369031" }, { "step": 3602, "loss": 0.7932910919189453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.453778" }, { "step": 3603, "loss": 0.443325936794281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.544810" }, { "step": 3604, "loss": 0.7245004177093506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.637481" }, { "step": 3605, "loss": 0.8576837778091431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.724273" }, { "step": 3606, "loss": 0.719822883605957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.819588" }, { "step": 3607, "loss": 0.5354809165000916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:27.920234" }, { "step": 3608, "loss": 1.010793685913086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.043201" }, { "step": 3609, "loss": 0.7549999356269836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.128780" }, { "step": 3610, "loss": 0.8599822521209717, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.215133" }, { "step": 3611, "loss": 0.8316090703010559, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.328574" }, { "step": 3612, "loss": 0.6729289293289185, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.413964" }, { "step": 3613, "loss": 0.5145192742347717, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.503461" }, { "step": 3614, "loss": 0.4790854752063751, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.589153" }, { "step": 3615, "loss": 0.49406516551971436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.674449" }, { "step": 3616, "loss": 0.626667857170105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.762797" }, { "step": 3617, "loss": 0.5661823153495789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.889695" }, { "step": 3618, "loss": 0.7214882969856262, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:28.975071" }, { "step": 3619, "loss": 0.7983721494674683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.061145" }, { "step": 3620, "loss": 0.6413308382034302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.147435" }, { "step": 3621, "loss": 0.33427131175994873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.232039" }, { "step": 3622, "loss": 0.5785319805145264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.324018" }, { "step": 3623, "loss": 0.6091713905334473, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.437481" }, { "step": 3624, "loss": 0.6647948026657104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.521325" }, { "step": 3625, "loss": 0.5258962512016296, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.614001" }, { "step": 3626, "loss": 0.7038394808769226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.709952" }, { "step": 3627, "loss": 0.5502418875694275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.816882" }, { "step": 3628, "loss": 0.7304177284240723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:29.928020" }, { "step": 3629, "loss": 0.6955971717834473, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.018926" }, { "step": 3630, "loss": 0.9733719825744629, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.104884" }, { "step": 3631, "loss": 1.1471389532089233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.194214" }, { "step": 3632, "loss": 0.4459802508354187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.293626" }, { "step": 3633, "loss": 0.6071240901947021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.385121" }, { "step": 3634, "loss": 0.8166104555130005, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.474133" }, { "step": 3635, "loss": 1.1864073276519775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.589618" }, { "step": 3636, "loss": 1.1113218069076538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.701970" }, { "step": 3637, "loss": 0.4787006974220276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.795322" }, { "step": 3638, "loss": 0.6308423280715942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.886853" }, { "step": 3639, "loss": 0.7467048764228821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:30.970888" }, { "step": 3640, "loss": 0.5724970698356628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.062495" }, { "step": 3641, "loss": 0.7029925584793091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.155732" }, { "step": 3642, "loss": 0.6001988649368286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.243126" }, { "step": 3643, "loss": 0.638079047203064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.331501" }, { "step": 3644, "loss": 0.5700355172157288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.421458" }, { "step": 3645, "loss": 0.735521674156189, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.539217" }, { "step": 3646, "loss": 0.7169949412345886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.661156" }, { "step": 3647, "loss": 0.9410363435745239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.771222" }, { "step": 3648, "loss": 0.632689356803894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.866049" }, { "step": 3649, "loss": 0.6644178032875061, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:31.967078" }, { "step": 3650, "loss": 0.6317693591117859, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.084682" }, { "step": 3651, "loss": 0.7364147901535034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.188591" }, { "step": 3652, "loss": 0.3768696188926697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.275861" }, { "step": 3653, "loss": 0.5961657166481018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.375538" }, { "step": 3654, "loss": 0.9141355156898499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.493208" }, { "step": 3655, "loss": 0.616354763507843, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.578872" }, { "step": 3656, "loss": 0.8282501101493835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.664154" }, { "step": 3657, "loss": 0.6012710332870483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.757771" }, { "step": 3658, "loss": 0.5668606162071228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.849129" }, { "step": 3659, "loss": 0.6860662698745728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:32.933884" }, { "step": 3660, "loss": 0.7705544233322144, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.050345" }, { "step": 3661, "loss": 0.7448934316635132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.143903" }, { "step": 3662, "loss": 0.5297625660896301, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.228665" }, { "step": 3663, "loss": 0.8690376281738281, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.351228" }, { "step": 3664, "loss": 0.9005142450332642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.442939" }, { "step": 3665, "loss": 0.3628401756286621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.544408" }, { "step": 3666, "loss": 0.5070520639419556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.638849" }, { "step": 3667, "loss": 0.7471835613250732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.724921" }, { "step": 3668, "loss": 0.7964947819709778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.814098" }, { "step": 3669, "loss": 0.8322948217391968, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.906797" }, { "step": 3670, "loss": 0.42720967531204224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:33.999312" }, { "step": 3671, "loss": 0.5922530889511108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.118347" }, { "step": 3672, "loss": 1.0912920236587524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.231762" }, { "step": 3673, "loss": 0.9594671130180359, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.317438" }, { "step": 3674, "loss": 0.7093074321746826, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.404077" }, { "step": 3675, "loss": 0.9246851205825806, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.523493" }, { "step": 3676, "loss": 0.6941893100738525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.608963" }, { "step": 3677, "loss": 0.5509451031684875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.702715" }, { "step": 3678, "loss": 0.6163704991340637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.788043" }, { "step": 3679, "loss": 0.7541394233703613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.879315" }, { "step": 3680, "loss": 0.6322023272514343, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:34.972170" }, { "step": 3681, "loss": 0.5868147611618042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.062291" }, { "step": 3682, "loss": 0.8840354084968567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.147504" }, { "step": 3683, "loss": 1.0008115768432617, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.233887" }, { "step": 3684, "loss": 0.9089349508285522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.319327" }, { "step": 3685, "loss": 0.9276180863380432, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.435764" }, { "step": 3686, "loss": 1.013383150100708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.524620" }, { "step": 3687, "loss": 1.0332316160202026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.614631" }, { "step": 3688, "loss": 0.5806143879890442, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.710242" }, { "step": 3689, "loss": 0.36834806203842163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.798015" }, { "step": 3690, "loss": 0.7223271131515503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.884441" }, { "step": 3691, "loss": 0.6843900084495544, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:35.978904" }, { "step": 3692, "loss": 0.6883947849273682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.069123" }, { "step": 3693, "loss": 0.6528030633926392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.160788" }, { "step": 3694, "loss": 1.0236990451812744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.255257" }, { "step": 3695, "loss": 0.555962324142456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.348342" }, { "step": 3696, "loss": 0.4237266480922699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.438036" }, { "step": 3697, "loss": 0.770813524723053, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.536392" }, { "step": 3698, "loss": 0.8070050477981567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.650520" }, { "step": 3699, "loss": 0.41004520654678345, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.746905" }, { "step": 3700, "loss": 0.4837310314178467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.836325" }, { "step": 3701, "loss": 0.7641002535820007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:36.921651" }, { "step": 3702, "loss": 0.6994880437850952, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.010386" }, { "step": 3703, "loss": 0.6106986403465271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.095855" }, { "step": 3704, "loss": 0.7010657787322998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.180574" }, { "step": 3705, "loss": 0.4799851179122925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.274492" }, { "step": 3706, "loss": 0.5144515037536621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.359208" }, { "step": 3707, "loss": 0.9157500267028809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.447801" }, { "step": 3708, "loss": 0.9376178979873657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.532206" }, { "step": 3709, "loss": 0.7311238646507263, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.617487" }, { "step": 3710, "loss": 0.5474494695663452, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.704266" }, { "step": 3711, "loss": 0.9260586500167847, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.811976" }, { "step": 3712, "loss": 0.6355711221694946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:37.907306" }, { "step": 3713, "loss": 0.8687762022018433, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.018198" }, { "step": 3714, "loss": 0.4934754967689514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.103836" }, { "step": 3715, "loss": 0.34082210063934326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.189382" }, { "step": 3716, "loss": 0.7327447533607483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.285738" }, { "step": 3717, "loss": 0.5794742703437805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.383232" }, { "step": 3718, "loss": 0.8810709714889526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.499143" }, { "step": 3719, "loss": 1.0295714139938354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.591981" }, { "step": 3720, "loss": 0.7161111831665039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.676334" }, { "step": 3721, "loss": 0.9044063091278076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.787226" }, { "step": 3722, "loss": 0.5674468278884888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.874398" }, { "step": 3723, "loss": 1.1358885765075684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:38.960786" }, { "step": 3724, "loss": 0.8772875666618347, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.046360" }, { "step": 3725, "loss": 0.7658478617668152, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.159192" }, { "step": 3726, "loss": 0.6888095140457153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.249438" }, { "step": 3727, "loss": 0.9181180000305176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.364647" }, { "step": 3728, "loss": 0.90409255027771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.450343" }, { "step": 3729, "loss": 0.6584352254867554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.536809" }, { "step": 3730, "loss": 0.7528303861618042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.648787" }, { "step": 3731, "loss": 0.6876543760299683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.733773" }, { "step": 3732, "loss": 0.5567758679389954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.820688" }, { "step": 3733, "loss": 0.9574236869812012, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.907203" }, { "step": 3734, "loss": 0.7155889868736267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:39.993047" }, { "step": 3735, "loss": 0.48936426639556885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.092817" }, { "step": 3736, "loss": 0.6676915884017944, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.203132" }, { "step": 3737, "loss": 1.0187863111495972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.290394" }, { "step": 3738, "loss": 0.9688100218772888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.427550" }, { "step": 3739, "loss": 0.8519027829170227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.546116" }, { "step": 3740, "loss": 0.6440362930297852, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.632176" }, { "step": 3741, "loss": 0.48718804121017456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.721510" }, { "step": 3742, "loss": 0.6604347229003906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.841071" }, { "step": 3743, "loss": 0.7549257874488831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:40.950042" }, { "step": 3744, "loss": 0.707741916179657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.038250" }, { "step": 3745, "loss": 0.8364392518997192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.154778" }, { "step": 3746, "loss": 1.03413987159729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.260910" }, { "step": 3747, "loss": 1.4037995338439941, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.347102" }, { "step": 3748, "loss": 0.9252796173095703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.436057" }, { "step": 3749, "loss": 0.716728687286377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.523080" }, { "step": 3750, "loss": 0.6589453816413879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.615846" }, { "step": 3751, "loss": 0.499381422996521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.709071" }, { "step": 3752, "loss": 1.0393052101135254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.823690" }, { "step": 3753, "loss": 0.6436030268669128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:41.932122" }, { "step": 3754, "loss": 0.7845348715782166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.023995" }, { "step": 3755, "loss": 0.642532229423523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.135526" }, { "step": 3756, "loss": 0.627705454826355, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.227662" }, { "step": 3757, "loss": 0.6232059597969055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.325928" }, { "step": 3758, "loss": 0.7805129885673523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.412422" }, { "step": 3759, "loss": 0.3383028507232666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.507962" }, { "step": 3760, "loss": 0.5449435710906982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.599593" }, { "step": 3761, "loss": 0.3998754024505615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.693011" }, { "step": 3762, "loss": 1.04180908203125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.781687" }, { "step": 3763, "loss": 0.6184144616127014, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.870288" }, { "step": 3764, "loss": 0.7078834772109985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:42.986157" }, { "step": 3765, "loss": 0.7574266791343689, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.080597" }, { "step": 3766, "loss": 0.6007462739944458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.175030" }, { "step": 3767, "loss": 0.6444622278213501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.292027" }, { "step": 3768, "loss": 0.9065086245536804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.381590" }, { "step": 3769, "loss": 0.776779294013977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.492922" }, { "step": 3770, "loss": 0.9101958274841309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.586372" }, { "step": 3771, "loss": 0.764866828918457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.675532" }, { "step": 3772, "loss": 0.7430555820465088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.760586" }, { "step": 3773, "loss": 0.9115076065063477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.845117" }, { "step": 3774, "loss": 0.5963147878646851, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:43.938363" }, { "step": 3775, "loss": 0.747352123260498, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.040140" }, { "step": 3776, "loss": 1.0798752307891846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.124737" }, { "step": 3777, "loss": 1.2867696285247803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.220006" }, { "step": 3778, "loss": 0.5937581062316895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.312715" }, { "step": 3779, "loss": 0.965147852897644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.399862" }, { "step": 3780, "loss": 1.0376886129379272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.487306" }, { "step": 3781, "loss": 0.6563605070114136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.585160" }, { "step": 3782, "loss": 0.7455357313156128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.676339" }, { "step": 3783, "loss": 0.5267466306686401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.772616" }, { "step": 3784, "loss": 0.9769341945648193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.905513" }, { "step": 3785, "loss": 0.6118327379226685, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:44.997840" }, { "step": 3786, "loss": 0.8331000804901123, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.084134" }, { "step": 3787, "loss": 0.5677124261856079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.175618" }, { "step": 3788, "loss": 1.0221253633499146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.262292" }, { "step": 3789, "loss": 0.8584257960319519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.353254" }, { "step": 3790, "loss": 0.5858149528503418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.446594" }, { "step": 3791, "loss": 0.6356329917907715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.542280" }, { "step": 3792, "loss": 0.4863981008529663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.632432" }, { "step": 3793, "loss": 0.4373018741607666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.725014" }, { "step": 3794, "loss": 0.3175414800643921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.820895" }, { "step": 3795, "loss": 0.9288845658302307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:45.932609" }, { "step": 3796, "loss": 0.5736441016197205, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.032670" }, { "step": 3797, "loss": 0.5892098546028137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.126094" }, { "step": 3798, "loss": 0.8151489496231079, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.217483" }, { "step": 3799, "loss": 0.997282862663269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.302291" }, { "step": 3800, "loss": 0.9171749949455261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.393379" }, { "step": 3801, "loss": 0.7817769050598145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.510279" }, { "step": 3802, "loss": 0.777082085609436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.596472" }, { "step": 3803, "loss": 0.5281125903129578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.694401" }, { "step": 3804, "loss": 0.7704322934150696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.802169" }, { "step": 3805, "loss": 0.5861756205558777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.889970" }, { "step": 3806, "loss": 0.633542001247406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:46.975549" }, { "step": 3807, "loss": 0.5120316743850708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.069571" }, { "step": 3808, "loss": 0.7742984294891357, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.167850" }, { "step": 3809, "loss": 1.1578983068466187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.294634" }, { "step": 3810, "loss": 0.53494793176651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.378738" }, { "step": 3811, "loss": 0.8140360116958618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.465867" }, { "step": 3812, "loss": 0.6005450487136841, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.552919" }, { "step": 3813, "loss": 0.7515520453453064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.638619" }, { "step": 3814, "loss": 0.8575421571731567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.723576" }, { "step": 3815, "loss": 0.482310950756073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.809431" }, { "step": 3816, "loss": 0.8988614082336426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:47.929401" }, { "step": 3817, "loss": 0.6670653223991394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.015119" }, { "step": 3818, "loss": 0.8676003217697144, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.106124" }, { "step": 3819, "loss": 0.8949428796768188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.198043" }, { "step": 3820, "loss": 0.43583667278289795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.294044" }, { "step": 3821, "loss": 0.7281476259231567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.385523" }, { "step": 3822, "loss": 0.5526284575462341, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.480292" }, { "step": 3823, "loss": 0.6508012413978577, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.568057" }, { "step": 3824, "loss": 0.4186936020851135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.652908" }, { "step": 3825, "loss": 0.8282821178436279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.748995" }, { "step": 3826, "loss": 0.5980455875396729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.841499" }, { "step": 3827, "loss": 0.4874056279659271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:48.930751" }, { "step": 3828, "loss": 0.4637134373188019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.023594" }, { "step": 3829, "loss": 0.7659237384796143, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.119975" }, { "step": 3830, "loss": 0.3937724232673645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.210728" }, { "step": 3831, "loss": 0.6205287575721741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.297649" }, { "step": 3832, "loss": 0.8640695810317993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.383308" }, { "step": 3833, "loss": 0.6377121806144714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.469913" }, { "step": 3834, "loss": 0.7882275581359863, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.560545" }, { "step": 3835, "loss": 0.36736488342285156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.646613" }, { "step": 3836, "loss": 0.7054440379142761, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.772813" }, { "step": 3837, "loss": 0.40633338689804077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.886999" }, { "step": 3838, "loss": 0.3991587162017822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:49.981802" }, { "step": 3839, "loss": 0.678564190864563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.069164" }, { "step": 3840, "loss": 0.729189395904541, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.179835" }, { "step": 3841, "loss": 0.6585935354232788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.267162" }, { "step": 3842, "loss": 0.8656661510467529, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.359981" }, { "step": 3843, "loss": 0.47487369179725647, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.445586" }, { "step": 3844, "loss": 0.4533774256706238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.542329" }, { "step": 3845, "loss": 0.6545374393463135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.655397" }, { "step": 3846, "loss": 0.6410188674926758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.748756" }, { "step": 3847, "loss": 0.6597904562950134, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.841097" }, { "step": 3848, "loss": 0.7970589995384216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:50.942120" }, { "step": 3849, "loss": 0.7634475231170654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.028448" }, { "step": 3850, "loss": 0.594353199005127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.119683" }, { "step": 3851, "loss": 0.6865619421005249, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.216718" }, { "step": 3852, "loss": 0.7583773136138916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.306016" }, { "step": 3853, "loss": 0.40857505798339844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.398699" }, { "step": 3854, "loss": 0.5122948288917542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.496154" }, { "step": 3855, "loss": 0.6941314339637756, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.583760" }, { "step": 3856, "loss": 0.33336782455444336, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.677266" }, { "step": 3857, "loss": 0.5197548270225525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.763095" }, { "step": 3858, "loss": 1.0236433744430542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.871668" }, { "step": 3859, "loss": 0.5878387689590454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:51.965209" }, { "step": 3860, "loss": 0.7457133531570435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.051956" }, { "step": 3861, "loss": 0.5337116718292236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.141831" }, { "step": 3862, "loss": 0.6696224212646484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.235201" }, { "step": 3863, "loss": 0.6967436075210571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.333609" }, { "step": 3864, "loss": 0.5076850056648254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.433442" }, { "step": 3865, "loss": 0.6388886570930481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.522332" }, { "step": 3866, "loss": 0.5532984733581543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.612924" }, { "step": 3867, "loss": 0.6844455599784851, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.733597" }, { "step": 3868, "loss": 0.5014735460281372, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.820207" }, { "step": 3869, "loss": 0.7701956629753113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:52.929939" }, { "step": 3870, "loss": 0.5236565470695496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.020872" }, { "step": 3871, "loss": 1.1502697467803955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.109916" }, { "step": 3872, "loss": 0.6324100494384766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.202132" }, { "step": 3873, "loss": 0.44990378618240356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.292458" }, { "step": 3874, "loss": 0.7977269887924194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.407693" }, { "step": 3875, "loss": 0.6709052324295044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.500520" }, { "step": 3876, "loss": 0.6257103681564331, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.585281" }, { "step": 3877, "loss": 0.7445796728134155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.695736" }, { "step": 3878, "loss": 0.6625194549560547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.810413" }, { "step": 3879, "loss": 0.6083663105964661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:53.894565" }, { "step": 3880, "loss": 0.8269760608673096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.002837" }, { "step": 3881, "loss": 0.8380786180496216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.095465" }, { "step": 3882, "loss": 0.8245964646339417, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.180479" }, { "step": 3883, "loss": 0.4577597379684448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.280883" }, { "step": 3884, "loss": 0.6267037391662598, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.373607" }, { "step": 3885, "loss": 1.0632541179656982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.463171" }, { "step": 3886, "loss": 0.47170355916023254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.549646" }, { "step": 3887, "loss": 0.9504173994064331, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.638409" }, { "step": 3888, "loss": 0.6634811162948608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.732208" }, { "step": 3889, "loss": 0.8237631320953369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.840808" }, { "step": 3890, "loss": 0.7664029598236084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:54.940593" }, { "step": 3891, "loss": 0.7298884391784668, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.062459" }, { "step": 3892, "loss": 0.6328850984573364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.159508" }, { "step": 3893, "loss": 0.550250768661499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.254235" }, { "step": 3894, "loss": 0.43488091230392456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.338094" }, { "step": 3895, "loss": 0.6637378931045532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.431153" }, { "step": 3896, "loss": 0.4592525362968445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.533139" }, { "step": 3897, "loss": 0.7020137310028076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.642899" }, { "step": 3898, "loss": 0.6709515452384949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.742243" }, { "step": 3899, "loss": 0.7567781805992126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.834612" }, { "step": 3900, "loss": 0.7741481065750122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:55.949596" }, { "step": 3901, "loss": 0.8861987590789795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.058440" }, { "step": 3902, "loss": 1.112809658050537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.175275" }, { "step": 3903, "loss": 0.5851202011108398, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.288548" }, { "step": 3904, "loss": 0.7429981827735901, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.373644" }, { "step": 3905, "loss": 0.7911025285720825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.466850" }, { "step": 3906, "loss": 1.048440933227539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.577357" }, { "step": 3907, "loss": 0.515114426612854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.670096" }, { "step": 3908, "loss": 0.9663360118865967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.756700" }, { "step": 3909, "loss": 0.9438917636871338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.870118" }, { "step": 3910, "loss": 1.0628165006637573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:56.956649" }, { "step": 3911, "loss": 0.629417896270752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.056544" }, { "step": 3912, "loss": 0.6651716828346252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.142791" }, { "step": 3913, "loss": 1.0152263641357422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.255241" }, { "step": 3914, "loss": 0.7804566621780396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.364571" }, { "step": 3915, "loss": 1.0326751470565796, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.457331" }, { "step": 3916, "loss": 0.2073667049407959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.545734" }, { "step": 3917, "loss": 0.901570200920105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.657066" }, { "step": 3918, "loss": 1.0000649690628052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.766794" }, { "step": 3919, "loss": 0.7748817205429077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.878159" }, { "step": 3920, "loss": 0.9676152467727661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:57.984592" }, { "step": 3921, "loss": 0.46573230624198914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.070631" }, { "step": 3922, "loss": 0.921971321105957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.162200" }, { "step": 3923, "loss": 0.7731993198394775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.271458" }, { "step": 3924, "loss": 0.8112424612045288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.366087" }, { "step": 3925, "loss": 0.6203204989433289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.454700" }, { "step": 3926, "loss": 0.6171555519104004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.549079" }, { "step": 3927, "loss": 0.8812916278839111, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.634794" }, { "step": 3928, "loss": 0.6074208617210388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.721486" }, { "step": 3929, "loss": 0.8371692895889282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.816776" }, { "step": 3930, "loss": 0.5349801182746887, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:58.915720" }, { "step": 3931, "loss": 0.5506554841995239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.004858" }, { "step": 3932, "loss": 1.2693202495574951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.102298" }, { "step": 3933, "loss": 0.7280970811843872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.203815" }, { "step": 3934, "loss": 0.6599118709564209, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.321071" }, { "step": 3935, "loss": 0.6205664873123169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.426794" }, { "step": 3936, "loss": 0.5284850597381592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.512951" }, { "step": 3937, "loss": 0.8353404998779297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.601264" }, { "step": 3938, "loss": 0.45644810795783997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.687407" }, { "step": 3939, "loss": 0.5378122329711914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.782935" }, { "step": 3940, "loss": 0.6036854982376099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.871433" }, { "step": 3941, "loss": 0.7459092140197754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:31:59.959013" }, { "step": 3942, "loss": 1.1234976053237915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.045037" }, { "step": 3943, "loss": 0.6743196249008179, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.139025" }, { "step": 3944, "loss": 0.7348915338516235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.250670" }, { "step": 3945, "loss": 1.0061143636703491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.335559" }, { "step": 3946, "loss": 0.9100029468536377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.448326" }, { "step": 3947, "loss": 0.7213761210441589, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.542556" }, { "step": 3948, "loss": 0.8381941318511963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.631452" }, { "step": 3949, "loss": 0.539997935295105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.716195" }, { "step": 3950, "loss": 0.38676056265830994, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.807729" }, { "step": 3951, "loss": 0.8227089643478394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.898906" }, { "step": 3952, "loss": 0.7002990245819092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:00.988716" }, { "step": 3953, "loss": 0.7482572793960571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.072329" }, { "step": 3954, "loss": 0.8617259860038757, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.159019" }, { "step": 3955, "loss": 0.5332213044166565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.249117" }, { "step": 3956, "loss": 0.7223800420761108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.334537" }, { "step": 3957, "loss": 0.683306097984314, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.425807" }, { "step": 3958, "loss": 0.8025012016296387, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.518873" }, { "step": 3959, "loss": 0.5490981340408325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.605200" }, { "step": 3960, "loss": 0.9908750057220459, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.690009" }, { "step": 3961, "loss": 0.7306417226791382, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.783288" }, { "step": 3962, "loss": 0.6773824691772461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.870207" }, { "step": 3963, "loss": 1.0408869981765747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:01.978992" }, { "step": 3964, "loss": 0.6503681540489197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.072824" }, { "step": 3965, "loss": 0.8559301495552063, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.164020" }, { "step": 3966, "loss": 0.3393673598766327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.256261" }, { "step": 3967, "loss": 0.6426959037780762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.347648" }, { "step": 3968, "loss": 1.0721796751022339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.461388" }, { "step": 3969, "loss": 0.7185088396072388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.559469" }, { "step": 3970, "loss": 0.6529883742332458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.644267" }, { "step": 3971, "loss": 0.7497450113296509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.735029" }, { "step": 3972, "loss": 0.7564785480499268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.829776" }, { "step": 3973, "loss": 0.4563884139060974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:02.921831" }, { "step": 3974, "loss": 0.6542634963989258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.022317" }, { "step": 3975, "loss": 0.7994625568389893, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.140183" }, { "step": 3976, "loss": 0.8212692141532898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.230093" }, { "step": 3977, "loss": 0.5908328294754028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.349626" }, { "step": 3978, "loss": 0.6284643411636353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.436110" }, { "step": 3979, "loss": 0.6739707589149475, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.521920" }, { "step": 3980, "loss": 0.7475026845932007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.613115" }, { "step": 3981, "loss": 0.6278472542762756, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.705616" }, { "step": 3982, "loss": 0.38390249013900757, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.796857" }, { "step": 3983, "loss": 0.7947949767112732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.902633" }, { "step": 3984, "loss": 1.3024288415908813, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:03.988892" }, { "step": 3985, "loss": 1.004842758178711, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.075488" }, { "step": 3986, "loss": 0.6497655510902405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.160276" }, { "step": 3987, "loss": 0.6036663055419922, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.282745" }, { "step": 3988, "loss": 1.0144940614700317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.376923" }, { "step": 3989, "loss": 0.6820271015167236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.463205" }, { "step": 3990, "loss": 0.853291928768158, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.552551" }, { "step": 3991, "loss": 0.4772564470767975, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.638040" }, { "step": 3992, "loss": 0.8628254532814026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.728989" }, { "step": 3993, "loss": 0.5235018730163574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.814836" }, { "step": 3994, "loss": 0.9084811210632324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:04.926690" }, { "step": 3995, "loss": 0.6888834238052368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:05.014323" }, { "step": 3996, "loss": 0.5559325814247131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:05.108169" }, { "step": 3997, "loss": 0.6592106223106384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:05.201398" }, { "step": 3998, "loss": 0.7409629821777344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:05.293264" }, { "step": 3999, "loss": 0.5546070337295532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:05.393329" }, { "step": 4000, "loss": 0.529172956943512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:05.481631" }, { "step": 4001, "loss": 0.7721158266067505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:28.686875" }, { "step": 4002, "loss": 0.4236280918121338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:28.774597" }, { "step": 4003, "loss": 0.6624025702476501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:28.863389" }, { "step": 4004, "loss": 0.9457405209541321, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:28.981102" }, { "step": 4005, "loss": 1.0044499635696411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.093871" }, { "step": 4006, "loss": 0.6338508725166321, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.186169" }, { "step": 4007, "loss": 0.7778016328811646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.275964" }, { "step": 4008, "loss": 0.6187494397163391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.363512" }, { "step": 4009, "loss": 1.1156940460205078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.449098" }, { "step": 4010, "loss": 0.3965778648853302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.541337" }, { "step": 4011, "loss": 0.6052382588386536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.655505" }, { "step": 4012, "loss": 0.642773449420929, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.745722" }, { "step": 4013, "loss": 0.7891987562179565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.858748" }, { "step": 4014, "loss": 0.642695426940918, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:29.969049" }, { "step": 4015, "loss": 0.8371440172195435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.060029" }, { "step": 4016, "loss": 0.6664531230926514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.149259" }, { "step": 4017, "loss": 0.8093774914741516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.236170" }, { "step": 4018, "loss": 1.0280113220214844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.323653" }, { "step": 4019, "loss": 0.621310830116272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.411683" }, { "step": 4020, "loss": 0.4928836226463318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.504314" }, { "step": 4021, "loss": 0.824362576007843, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.590275" }, { "step": 4022, "loss": 0.6435485482215881, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.684861" }, { "step": 4023, "loss": 0.6176392436027527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.772284" }, { "step": 4024, "loss": 0.5529811978340149, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.857609" }, { "step": 4025, "loss": 1.1394717693328857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:30.944484" }, { "step": 4026, "loss": 0.38792097568511963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.029600" }, { "step": 4027, "loss": 0.6751983165740967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.125431" }, { "step": 4028, "loss": 0.7245601415634155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.244614" }, { "step": 4029, "loss": 0.8703557848930359, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.332566" }, { "step": 4030, "loss": 0.608992338180542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.428571" }, { "step": 4031, "loss": 0.4422937035560608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.514720" }, { "step": 4032, "loss": 0.6598802804946899, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.600170" }, { "step": 4033, "loss": 0.8396927118301392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.716867" }, { "step": 4034, "loss": 0.6176949739456177, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.804489" }, { "step": 4035, "loss": 0.47083160281181335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.895958" }, { "step": 4036, "loss": 0.9076707363128662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:31.988572" }, { "step": 4037, "loss": 0.6115739941596985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.074134" }, { "step": 4038, "loss": 0.5895137786865234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.161154" }, { "step": 4039, "loss": 0.6104173064231873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.247156" }, { "step": 4040, "loss": 0.5689780712127686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.340698" }, { "step": 4041, "loss": 0.64420485496521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.440574" }, { "step": 4042, "loss": 0.7202086448669434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.534910" }, { "step": 4043, "loss": 0.6554638147354126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.625989" }, { "step": 4044, "loss": 0.5918036699295044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.714557" }, { "step": 4045, "loss": 0.5589925646781921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.806038" }, { "step": 4046, "loss": 0.4677150845527649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:32.896320" }, { "step": 4047, "loss": 0.9348326921463013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.022238" }, { "step": 4048, "loss": 1.0543947219848633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.141428" }, { "step": 4049, "loss": 0.7945642471313477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.229390" }, { "step": 4050, "loss": 0.8686156868934631, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.316927" }, { "step": 4051, "loss": 0.49475425481796265, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.435733" }, { "step": 4052, "loss": 0.49585455656051636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.527700" }, { "step": 4053, "loss": 0.5495976805686951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.618916" }, { "step": 4054, "loss": 1.0071601867675781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.767508" }, { "step": 4055, "loss": 0.7983084917068481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.887401" }, { "step": 4056, "loss": 0.6560873985290527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:33.971775" }, { "step": 4057, "loss": 0.7737902402877808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.062923" }, { "step": 4058, "loss": 0.3686009347438812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.156901" }, { "step": 4059, "loss": 1.1093248128890991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.243144" }, { "step": 4060, "loss": 0.7270784974098206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.348678" }, { "step": 4061, "loss": 0.8093085289001465, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.456613" }, { "step": 4062, "loss": 0.6990854740142822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.576889" }, { "step": 4063, "loss": 0.6174101829528809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.661289" }, { "step": 4064, "loss": 0.620352566242218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.751834" }, { "step": 4065, "loss": 1.1984206438064575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.840782" }, { "step": 4066, "loss": 0.6955686211585999, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:34.932489" }, { "step": 4067, "loss": 0.7026939392089844, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.050738" }, { "step": 4068, "loss": 0.7015250325202942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.141014" }, { "step": 4069, "loss": 0.44732385873794556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.234619" }, { "step": 4070, "loss": 0.921484112739563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.330111" }, { "step": 4071, "loss": 0.8782689571380615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.417072" }, { "step": 4072, "loss": 0.45499229431152344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.511311" }, { "step": 4073, "loss": 0.4817284941673279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.603459" }, { "step": 4074, "loss": 0.8155599236488342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.688786" }, { "step": 4075, "loss": 0.6429685950279236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.781385" }, { "step": 4076, "loss": 1.0064184665679932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.894666" }, { "step": 4077, "loss": 1.0803050994873047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:35.984179" }, { "step": 4078, "loss": 0.5805218815803528, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.070019" }, { "step": 4079, "loss": 0.6859188079833984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.156264" }, { "step": 4080, "loss": 0.7243739366531372, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.264834" }, { "step": 4081, "loss": 0.6213406920433044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.351788" }, { "step": 4082, "loss": 0.8537807464599609, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.439056" }, { "step": 4083, "loss": 0.62555330991745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.530048" }, { "step": 4084, "loss": 0.8097885847091675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.614055" }, { "step": 4085, "loss": 0.7200748920440674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.710668" }, { "step": 4086, "loss": 0.4248407483100891, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.803336" }, { "step": 4087, "loss": 1.2589819431304932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.890955" }, { "step": 4088, "loss": 0.7321971654891968, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:36.974989" }, { "step": 4089, "loss": 0.9110621213912964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.113822" }, { "step": 4090, "loss": 0.47061342000961304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.200807" }, { "step": 4091, "loss": 0.7839922308921814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.288309" }, { "step": 4092, "loss": 0.8927522897720337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.428718" }, { "step": 4093, "loss": 0.7656604051589966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.520147" }, { "step": 4094, "loss": 0.730659544467926, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.610118" }, { "step": 4095, "loss": 0.5360363125801086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.695893" }, { "step": 4096, "loss": 0.7469783425331116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.794011" }, { "step": 4097, "loss": 0.5818971395492554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.885636" }, { "step": 4098, "loss": 0.793914258480072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:37.977110" }, { "step": 4099, "loss": 0.677129328250885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.072974" }, { "step": 4100, "loss": 0.8178413510322571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.190445" }, { "step": 4101, "loss": 0.7197195887565613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.278543" }, { "step": 4102, "loss": 0.8234142661094666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.386579" }, { "step": 4103, "loss": 0.7026233077049255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.476353" }, { "step": 4104, "loss": 0.4637237787246704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.566768" }, { "step": 4105, "loss": 0.7488948106765747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.653440" }, { "step": 4106, "loss": 0.48793840408325195, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.741906" }, { "step": 4107, "loss": 0.6086101531982422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.831091" }, { "step": 4108, "loss": 0.9469621181488037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:38.946434" }, { "step": 4109, "loss": 0.6449520587921143, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.042836" }, { "step": 4110, "loss": 0.5520005226135254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.143026" }, { "step": 4111, "loss": 0.7848498225212097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.229922" }, { "step": 4112, "loss": 0.8217064142227173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.347290" }, { "step": 4113, "loss": 0.5945601463317871, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.442125" }, { "step": 4114, "loss": 0.4701143801212311, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.530114" }, { "step": 4115, "loss": 0.5185568332672119, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.617031" }, { "step": 4116, "loss": 0.6884576678276062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.710999" }, { "step": 4117, "loss": 0.44937992095947266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.798408" }, { "step": 4118, "loss": 0.6578072309494019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.884486" }, { "step": 4119, "loss": 0.8040587306022644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:39.971241" }, { "step": 4120, "loss": 0.8668879270553589, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.076526" }, { "step": 4121, "loss": 0.5775039196014404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.161540" }, { "step": 4122, "loss": 0.753852128982544, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.262915" }, { "step": 4123, "loss": 0.6173755526542664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.352465" }, { "step": 4124, "loss": 0.6625674366950989, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.448176" }, { "step": 4125, "loss": 0.8039708137512207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.534755" }, { "step": 4126, "loss": 0.9872462749481201, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.629565" }, { "step": 4127, "loss": 0.40502259135246277, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.719289" }, { "step": 4128, "loss": 0.5676488876342773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.806900" }, { "step": 4129, "loss": 0.8115606904029846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.892139" }, { "step": 4130, "loss": 0.5888932943344116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:40.985005" }, { "step": 4131, "loss": 0.6250647306442261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.071904" }, { "step": 4132, "loss": 0.6283441781997681, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.161230" }, { "step": 4133, "loss": 0.3866039514541626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.261330" }, { "step": 4134, "loss": 0.5865382552146912, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.361336" }, { "step": 4135, "loss": 0.44355833530426025, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.454087" }, { "step": 4136, "loss": 1.2028391361236572, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.540526" }, { "step": 4137, "loss": 0.7964454293251038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.634209" }, { "step": 4138, "loss": 0.6054728627204895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.734857" }, { "step": 4139, "loss": 0.8584482669830322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.848695" }, { "step": 4140, "loss": 0.63525390625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:41.942386" }, { "step": 4141, "loss": 0.41986480355262756, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.055013" }, { "step": 4142, "loss": 0.8249824047088623, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.166503" }, { "step": 4143, "loss": 0.7795582413673401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.281568" }, { "step": 4144, "loss": 0.4930325746536255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.379862" }, { "step": 4145, "loss": 0.48129141330718994, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.472589" }, { "step": 4146, "loss": 0.6040972471237183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.565944" }, { "step": 4147, "loss": 0.9783791899681091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.685176" }, { "step": 4148, "loss": 0.799782931804657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.770328" }, { "step": 4149, "loss": 0.8367986679077148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.872931" }, { "step": 4150, "loss": 0.8127198219299316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:42.965454" }, { "step": 4151, "loss": 0.6161424517631531, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.060713" }, { "step": 4152, "loss": 0.427482008934021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.153840" }, { "step": 4153, "loss": 0.6769545078277588, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.239273" }, { "step": 4154, "loss": 0.5466437339782715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.325638" }, { "step": 4155, "loss": 0.5093727707862854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.411649" }, { "step": 4156, "loss": 1.0981965065002441, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.497083" }, { "step": 4157, "loss": 0.5937954187393188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.593941" }, { "step": 4158, "loss": 0.49312514066696167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.678758" }, { "step": 4159, "loss": 0.6413602828979492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.772289" }, { "step": 4160, "loss": 0.4104771018028259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.872394" }, { "step": 4161, "loss": 0.9482293128967285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:43.994547" }, { "step": 4162, "loss": 0.6327148079872131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.081198" }, { "step": 4163, "loss": 0.9197015166282654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.175154" }, { "step": 4164, "loss": 0.7999700903892517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.268050" }, { "step": 4165, "loss": 0.9142574071884155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.354910" }, { "step": 4166, "loss": 0.9262833595275879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.476017" }, { "step": 4167, "loss": 0.9039719104766846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.592804" }, { "step": 4168, "loss": 0.8186023235321045, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.711758" }, { "step": 4169, "loss": 0.8294554948806763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.813684" }, { "step": 4170, "loss": 0.9678144454956055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:44.934625" }, { "step": 4171, "loss": 0.8283734321594238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.019156" }, { "step": 4172, "loss": 0.7793818712234497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.107569" }, { "step": 4173, "loss": 0.8335491418838501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.220222" }, { "step": 4174, "loss": 0.31014904379844666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.312723" }, { "step": 4175, "loss": 0.49891817569732666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.405385" }, { "step": 4176, "loss": 0.41393715143203735, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.489948" }, { "step": 4177, "loss": 0.5017579197883606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.578662" }, { "step": 4178, "loss": 0.8867490291595459, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.665305" }, { "step": 4179, "loss": 0.6076840162277222, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.754429" }, { "step": 4180, "loss": 0.38394051790237427, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.839903" }, { "step": 4181, "loss": 0.6770573258399963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:45.928979" }, { "step": 4182, "loss": 0.6449228525161743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.021225" }, { "step": 4183, "loss": 0.6932756900787354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.144047" }, { "step": 4184, "loss": 1.0645697116851807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.235122" }, { "step": 4185, "loss": 0.5349183082580566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.345326" }, { "step": 4186, "loss": 0.7996063232421875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.462588" }, { "step": 4187, "loss": 0.7084819078445435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.557385" }, { "step": 4188, "loss": 0.8115304708480835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.646318" }, { "step": 4189, "loss": 0.5351648330688477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.741266" }, { "step": 4190, "loss": 0.48866474628448486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.826049" }, { "step": 4191, "loss": 0.6347789764404297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:46.917111" }, { "step": 4192, "loss": 0.5569772720336914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.008287" }, { "step": 4193, "loss": 0.874649167060852, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.099164" }, { "step": 4194, "loss": 0.9336013793945312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.242445" }, { "step": 4195, "loss": 1.1781965494155884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.328913" }, { "step": 4196, "loss": 0.6637974381446838, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.420386" }, { "step": 4197, "loss": 0.47769588232040405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.514150" }, { "step": 4198, "loss": 0.885658860206604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.602071" }, { "step": 4199, "loss": 0.4423518180847168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.689274" }, { "step": 4200, "loss": 0.7402842044830322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.779456" }, { "step": 4201, "loss": 1.0331504344940186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.876491" }, { "step": 4202, "loss": 0.8710715770721436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:47.990152" }, { "step": 4203, "loss": 1.0609954595565796, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.081084" }, { "step": 4204, "loss": 0.5255917906761169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.174000" }, { "step": 4205, "loss": 0.6759344935417175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.260914" }, { "step": 4206, "loss": 0.8134808540344238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.382313" }, { "step": 4207, "loss": 0.9727201461791992, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.468791" }, { "step": 4208, "loss": 0.7930160760879517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.581393" }, { "step": 4209, "loss": 0.858220100402832, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.666623" }, { "step": 4210, "loss": 0.5454177260398865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.758456" }, { "step": 4211, "loss": 0.6424260139465332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.843789" }, { "step": 4212, "loss": 0.9870455861091614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:48.928801" }, { "step": 4213, "loss": 0.5606896877288818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.029031" }, { "step": 4214, "loss": 0.9382287263870239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.116275" }, { "step": 4215, "loss": 0.8572368621826172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.229492" }, { "step": 4216, "loss": 0.7889848947525024, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.317066" }, { "step": 4217, "loss": 0.7080368995666504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.411316" }, { "step": 4218, "loss": 0.9105521440505981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.523323" }, { "step": 4219, "loss": 0.8505791425704956, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.607930" }, { "step": 4220, "loss": 0.6384017467498779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.726507" }, { "step": 4221, "loss": 0.6516768336296082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.816298" }, { "step": 4222, "loss": 0.7127789258956909, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:49.921760" }, { "step": 4223, "loss": 0.8613489866256714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.030116" }, { "step": 4224, "loss": 0.743548572063446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.150307" }, { "step": 4225, "loss": 0.824352502822876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.246782" }, { "step": 4226, "loss": 0.7139544486999512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.340530" }, { "step": 4227, "loss": 0.5254002213478088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.425484" }, { "step": 4228, "loss": 1.050495982170105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.527409" }, { "step": 4229, "loss": 0.6792393922805786, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.612381" }, { "step": 4230, "loss": 0.8678547739982605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.700499" }, { "step": 4231, "loss": 0.7990873456001282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.786887" }, { "step": 4232, "loss": 0.8441230654716492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.873969" }, { "step": 4233, "loss": 0.7128361463546753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:50.967098" }, { "step": 4234, "loss": 0.789832592010498, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.051997" }, { "step": 4235, "loss": 0.5108278393745422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.137919" }, { "step": 4236, "loss": 0.692238450050354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.226217" }, { "step": 4237, "loss": 0.48419618606567383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.311725" }, { "step": 4238, "loss": 0.6671053767204285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.408540" }, { "step": 4239, "loss": 0.6865633130073547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.495797" }, { "step": 4240, "loss": 0.9258293509483337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.580515" }, { "step": 4241, "loss": 0.46618950366973877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.674344" }, { "step": 4242, "loss": 0.5796530246734619, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.770545" }, { "step": 4243, "loss": 0.8370764255523682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.861547" }, { "step": 4244, "loss": 0.5729608535766602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:51.947044" }, { "step": 4245, "loss": 0.3521139919757843, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.047565" }, { "step": 4246, "loss": 1.0304549932479858, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.133696" }, { "step": 4247, "loss": 0.5334585905075073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.228181" }, { "step": 4248, "loss": 0.6420542001724243, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.347424" }, { "step": 4249, "loss": 0.8521848917007446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.435260" }, { "step": 4250, "loss": 0.9039698839187622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.522147" }, { "step": 4251, "loss": 0.5647283792495728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.620805" }, { "step": 4252, "loss": 0.6056967973709106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.713223" }, { "step": 4253, "loss": 0.7544269561767578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.798207" }, { "step": 4254, "loss": 0.39516574144363403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.894850" }, { "step": 4255, "loss": 0.797440767288208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:52.992118" }, { "step": 4256, "loss": 0.6196009516716003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.077470" }, { "step": 4257, "loss": 0.6001626253128052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.171284" }, { "step": 4258, "loss": 0.3982445299625397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.260169" }, { "step": 4259, "loss": 0.8271297216415405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.375969" }, { "step": 4260, "loss": 0.7964526414871216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.463514" }, { "step": 4261, "loss": 1.0645959377288818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.574702" }, { "step": 4262, "loss": 1.2304837703704834, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.689917" }, { "step": 4263, "loss": 0.6239094138145447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.776746" }, { "step": 4264, "loss": 0.6702883243560791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.862802" }, { "step": 4265, "loss": 0.5157583951950073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:53.949985" }, { "step": 4266, "loss": 0.8002297878265381, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.061062" }, { "step": 4267, "loss": 0.9026281833648682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.152830" }, { "step": 4268, "loss": 0.8379791975021362, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.272199" }, { "step": 4269, "loss": 0.8588365316390991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.379628" }, { "step": 4270, "loss": 0.3479216694831848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.478767" }, { "step": 4271, "loss": 0.8655010461807251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.587975" }, { "step": 4272, "loss": 0.47189444303512573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.686394" }, { "step": 4273, "loss": 0.6578713655471802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.786762" }, { "step": 4274, "loss": 0.7202379703521729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.880426" }, { "step": 4275, "loss": 0.696702241897583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:54.992334" }, { "step": 4276, "loss": 0.6373885869979858, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.083250" }, { "step": 4277, "loss": 0.5377643704414368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.176190" }, { "step": 4278, "loss": 0.49751389026641846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.276979" }, { "step": 4279, "loss": 0.5857259631156921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.363215" }, { "step": 4280, "loss": 0.5913466215133667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.448996" }, { "step": 4281, "loss": 0.5950331687927246, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.534253" }, { "step": 4282, "loss": 0.869965136051178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.647723" }, { "step": 4283, "loss": 0.5868836045265198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.736784" }, { "step": 4284, "loss": 0.8246676921844482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.831881" }, { "step": 4285, "loss": 0.7547220587730408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:55.951041" }, { "step": 4286, "loss": 0.5658330917358398, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.044383" }, { "step": 4287, "loss": 0.5551161766052246, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.172210" }, { "step": 4288, "loss": 1.0352104902267456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.267682" }, { "step": 4289, "loss": 0.7945176362991333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.380838" }, { "step": 4290, "loss": 0.3685556650161743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.468556" }, { "step": 4291, "loss": 0.8835870027542114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.598303" }, { "step": 4292, "loss": 0.9849673509597778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.693290" }, { "step": 4293, "loss": 0.882844865322113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.779216" }, { "step": 4294, "loss": 0.9585925340652466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.865951" }, { "step": 4295, "loss": 0.6927658319473267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:56.976730" }, { "step": 4296, "loss": 0.664879560470581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.098449" }, { "step": 4297, "loss": 0.49232161045074463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.200208" }, { "step": 4298, "loss": 0.9147530794143677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.291757" }, { "step": 4299, "loss": 0.5293864607810974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.377580" }, { "step": 4300, "loss": 0.7095783948898315, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.480939" }, { "step": 4301, "loss": 0.522017240524292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.572938" }, { "step": 4302, "loss": 0.5157382488250732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.664067" }, { "step": 4303, "loss": 0.6363059282302856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.759514" }, { "step": 4304, "loss": 0.7110946178436279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.857065" }, { "step": 4305, "loss": 0.8563963174819946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:57.945144" }, { "step": 4306, "loss": 0.73280268907547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.071944" }, { "step": 4307, "loss": 0.7595398426055908, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.188384" }, { "step": 4308, "loss": 0.6715449094772339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.275520" }, { "step": 4309, "loss": 0.8491821885108948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.386901" }, { "step": 4310, "loss": 1.2654082775115967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.507178" }, { "step": 4311, "loss": 0.9627633094787598, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.596781" }, { "step": 4312, "loss": 0.8596320152282715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.721315" }, { "step": 4313, "loss": 0.5744572877883911, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.814797" }, { "step": 4314, "loss": 0.6828210353851318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:58.909210" }, { "step": 4315, "loss": 0.7571737170219421, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.000982" }, { "step": 4316, "loss": 0.8590049147605896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.114757" }, { "step": 4317, "loss": 0.7097452282905579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.202975" }, { "step": 4318, "loss": 0.592113733291626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.294999" }, { "step": 4319, "loss": 0.810396671295166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.387210" }, { "step": 4320, "loss": 0.40656399726867676, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.480678" }, { "step": 4321, "loss": 0.9538335204124451, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.567883" }, { "step": 4322, "loss": 0.8385850191116333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.679744" }, { "step": 4323, "loss": 1.000894546508789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.770041" }, { "step": 4324, "loss": 0.5891127586364746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.862298" }, { "step": 4325, "loss": 0.8803768157958984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:32:59.946890" }, { "step": 4326, "loss": 0.512547492980957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.037084" }, { "step": 4327, "loss": 0.8626681566238403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.127680" }, { "step": 4328, "loss": 0.6544216275215149, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.251105" }, { "step": 4329, "loss": 0.8607130646705627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.344786" }, { "step": 4330, "loss": 0.9435634613037109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.431208" }, { "step": 4331, "loss": 0.6731765270233154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.547205" }, { "step": 4332, "loss": 0.8267129063606262, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.660164" }, { "step": 4333, "loss": 0.6907755136489868, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.742217" }, { "step": 4334, "loss": 0.989837646484375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.833218" }, { "step": 4335, "loss": 0.8719937801361084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:00.946190" }, { "step": 4336, "loss": 0.7188292145729065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.063243" }, { "step": 4337, "loss": 0.993767499923706, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.175956" }, { "step": 4338, "loss": 0.5952283143997192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.260624" }, { "step": 4339, "loss": 0.7573654651641846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.377654" }, { "step": 4340, "loss": 1.2193406820297241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.465525" }, { "step": 4341, "loss": 0.4681357443332672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.552708" }, { "step": 4342, "loss": 0.39688044786453247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.645725" }, { "step": 4343, "loss": 0.8095057010650635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.762609" }, { "step": 4344, "loss": 0.640727162361145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.853017" }, { "step": 4345, "loss": 0.44124454259872437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:01.942934" }, { "step": 4346, "loss": 0.6586432456970215, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.036046" }, { "step": 4347, "loss": 0.5708425641059875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.160283" }, { "step": 4348, "loss": 0.9373295307159424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.248680" }, { "step": 4349, "loss": 0.9358236789703369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.334104" }, { "step": 4350, "loss": 0.5365274548530579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.427804" }, { "step": 4351, "loss": 0.5498960018157959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.520623" }, { "step": 4352, "loss": 0.8007135391235352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.606923" }, { "step": 4353, "loss": 0.8637694120407104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.692059" }, { "step": 4354, "loss": 0.5956277847290039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.805572" }, { "step": 4355, "loss": 0.6326507925987244, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:02.912382" }, { "step": 4356, "loss": 0.6156419515609741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.026344" }, { "step": 4357, "loss": 1.1346652507781982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.138772" }, { "step": 4358, "loss": 0.7661285996437073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.242359" }, { "step": 4359, "loss": 0.570810079574585, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.344088" }, { "step": 4360, "loss": 0.460884690284729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.430344" }, { "step": 4361, "loss": 0.9453504085540771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.546207" }, { "step": 4362, "loss": 0.7115743160247803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.633109" }, { "step": 4363, "loss": 0.7401365041732788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.746337" }, { "step": 4364, "loss": 0.4934474229812622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.842307" }, { "step": 4365, "loss": 0.689947783946991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:03.927274" }, { "step": 4366, "loss": 0.4363318085670471, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.011776" }, { "step": 4367, "loss": 0.5405049324035645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.103616" }, { "step": 4368, "loss": 0.5525159239768982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.187735" }, { "step": 4369, "loss": 0.5130691528320312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.282613" }, { "step": 4370, "loss": 0.46462923288345337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.367981" }, { "step": 4371, "loss": 1.205744981765747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.454446" }, { "step": 4372, "loss": 0.423440158367157, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.540997" }, { "step": 4373, "loss": 0.4729984402656555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.628479" }, { "step": 4374, "loss": 0.6655016541481018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.717633" }, { "step": 4375, "loss": 0.5121303796768188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.803800" }, { "step": 4376, "loss": 0.37901896238327026, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:04.896127" }, { "step": 4377, "loss": 0.7709048986434937, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.021195" }, { "step": 4378, "loss": 0.6606408357620239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.137420" }, { "step": 4379, "loss": 1.0581856966018677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.226955" }, { "step": 4380, "loss": 0.30103933811187744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.317118" }, { "step": 4381, "loss": 0.6540720462799072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.405323" }, { "step": 4382, "loss": 1.1443668603897095, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.532930" }, { "step": 4383, "loss": 0.5629042387008667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.627372" }, { "step": 4384, "loss": 0.4378853440284729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.740735" }, { "step": 4385, "loss": 0.7639929056167603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.824916" }, { "step": 4386, "loss": 0.4349641799926758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:05.923826" }, { "step": 4387, "loss": 0.5751827955245972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.016918" }, { "step": 4388, "loss": 0.4022147059440613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.102121" }, { "step": 4389, "loss": 0.5678647756576538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.209147" }, { "step": 4390, "loss": 0.5268075466156006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.300619" }, { "step": 4391, "loss": 0.6089509725570679, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.386261" }, { "step": 4392, "loss": 0.5552861094474792, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.477094" }, { "step": 4393, "loss": 0.356047660112381, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.576806" }, { "step": 4394, "loss": 0.8515894412994385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.665212" }, { "step": 4395, "loss": 0.4857677221298218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.756861" }, { "step": 4396, "loss": 0.5743920207023621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.845709" }, { "step": 4397, "loss": 0.4715458154678345, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:06.932944" }, { "step": 4398, "loss": 0.8763116598129272, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.023707" }, { "step": 4399, "loss": 0.4552711248397827, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.110565" }, { "step": 4400, "loss": 0.5860386490821838, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.204809" }, { "step": 4401, "loss": 0.8158529996871948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.298702" }, { "step": 4402, "loss": 0.4334377646446228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.392731" }, { "step": 4403, "loss": 0.6628870964050293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.485307" }, { "step": 4404, "loss": 0.4274843633174896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.577175" }, { "step": 4405, "loss": 0.7728078365325928, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.691967" }, { "step": 4406, "loss": 0.5647032856941223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.784408" }, { "step": 4407, "loss": 0.5819523334503174, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.872425" }, { "step": 4408, "loss": 0.5751702189445496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:07.958562" }, { "step": 4409, "loss": 0.6248139142990112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.045108" }, { "step": 4410, "loss": 0.6288192868232727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.152214" }, { "step": 4411, "loss": 0.7150739431381226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.240914" }, { "step": 4412, "loss": 0.46487218141555786, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.325200" }, { "step": 4413, "loss": 0.7997291088104248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.431171" }, { "step": 4414, "loss": 0.6104859709739685, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.516836" }, { "step": 4415, "loss": 0.6374920606613159, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.608807" }, { "step": 4416, "loss": 0.409280925989151, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.704414" }, { "step": 4417, "loss": 0.6721562147140503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.820287" }, { "step": 4418, "loss": 1.0293081998825073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:08.905788" }, { "step": 4419, "loss": 0.8954026103019714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.000150" }, { "step": 4420, "loss": 0.6505874395370483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.111769" }, { "step": 4421, "loss": 0.7672909498214722, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.225063" }, { "step": 4422, "loss": 0.6359696984291077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.314697" }, { "step": 4423, "loss": 0.7470318078994751, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.399759" }, { "step": 4424, "loss": 0.4980388581752777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.489831" }, { "step": 4425, "loss": 0.4921974837779999, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.574621" }, { "step": 4426, "loss": 0.6190827488899231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.660180" }, { "step": 4427, "loss": 0.697561502456665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.757032" }, { "step": 4428, "loss": 0.5370991230010986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.843948" }, { "step": 4429, "loss": 0.4449580907821655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:09.932962" }, { "step": 4430, "loss": 0.897764265537262, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.029842" }, { "step": 4431, "loss": 0.8626962900161743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.115000" }, { "step": 4432, "loss": 0.597116231918335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.234130" }, { "step": 4433, "loss": 0.35983651876449585, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.326989" }, { "step": 4434, "loss": 0.5022519826889038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.422983" }, { "step": 4435, "loss": 0.8877780437469482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.536234" }, { "step": 4436, "loss": 0.5101726055145264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.629231" }, { "step": 4437, "loss": 0.9533103704452515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.725108" }, { "step": 4438, "loss": 0.43701767921447754, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.816301" }, { "step": 4439, "loss": 0.8100862503051758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:10.930911" }, { "step": 4440, "loss": 0.6079700589179993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.016589" }, { "step": 4441, "loss": 0.9016113877296448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.105329" }, { "step": 4442, "loss": 0.7061419486999512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.250390" }, { "step": 4443, "loss": 0.5908485054969788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.341995" }, { "step": 4444, "loss": 0.7863566279411316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.463473" }, { "step": 4445, "loss": 0.5729598999023438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.560645" }, { "step": 4446, "loss": 0.4370667040348053, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.650213" }, { "step": 4447, "loss": 0.6164653301239014, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.749889" }, { "step": 4448, "loss": 0.6385836601257324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.838048" }, { "step": 4449, "loss": 0.34244391322135925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:11.941901" }, { "step": 4450, "loss": 0.5049639940261841, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.034285" }, { "step": 4451, "loss": 0.5032544732093811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.154321" }, { "step": 4452, "loss": 0.6864284873008728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.248196" }, { "step": 4453, "loss": 0.6430437564849854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.333525" }, { "step": 4454, "loss": 0.8302949070930481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.450766" }, { "step": 4455, "loss": 0.7035237550735474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.566829" }, { "step": 4456, "loss": 0.40915772318840027, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.664057" }, { "step": 4457, "loss": 0.4789721369743347, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.760989" }, { "step": 4458, "loss": 0.7056089639663696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.856641" }, { "step": 4459, "loss": 0.4773213863372803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:12.951819" }, { "step": 4460, "loss": 0.9759652614593506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.069730" }, { "step": 4461, "loss": 0.5017484426498413, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.189174" }, { "step": 4462, "loss": 0.8604616522789001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.287878" }, { "step": 4463, "loss": 0.5602333545684814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.374061" }, { "step": 4464, "loss": 0.8669891357421875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.488693" }, { "step": 4465, "loss": 0.6441047191619873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.575382" }, { "step": 4466, "loss": 0.43321385979652405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.661344" }, { "step": 4467, "loss": 0.7118913531303406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.746059" }, { "step": 4468, "loss": 0.6425536274909973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.831508" }, { "step": 4469, "loss": 0.34983760118484497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:13.919434" }, { "step": 4470, "loss": 0.7558490633964539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.006144" }, { "step": 4471, "loss": 0.7575470209121704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.116979" }, { "step": 4472, "loss": 0.5213481783866882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.203174" }, { "step": 4473, "loss": 0.791479766368866, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.328658" }, { "step": 4474, "loss": 0.35250604152679443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.423443" }, { "step": 4475, "loss": 0.7951623201370239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.517338" }, { "step": 4476, "loss": 0.9587668180465698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.633414" }, { "step": 4477, "loss": 1.0354998111724854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.727990" }, { "step": 4478, "loss": 0.4626592695713043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.821460" }, { "step": 4479, "loss": 0.4919637143611908, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:14.914108" }, { "step": 4480, "loss": 0.5352931022644043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.000963" }, { "step": 4481, "loss": 0.8126494288444519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.087990" }, { "step": 4482, "loss": 0.5629255175590515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.197032" }, { "step": 4483, "loss": 0.9839394092559814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.286404" }, { "step": 4484, "loss": 0.848615288734436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.403802" }, { "step": 4485, "loss": 0.5547665357589722, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.495520" }, { "step": 4486, "loss": 0.5515184998512268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.587339" }, { "step": 4487, "loss": 0.6710628271102905, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.672282" }, { "step": 4488, "loss": 0.6086810827255249, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.774966" }, { "step": 4489, "loss": 0.3138313591480255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.867051" }, { "step": 4490, "loss": 0.8759921789169312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:15.951981" }, { "step": 4491, "loss": 0.6350056529045105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.069147" }, { "step": 4492, "loss": 0.6467010974884033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.187346" }, { "step": 4493, "loss": 0.5905323028564453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.273267" }, { "step": 4494, "loss": 0.9440011382102966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.359057" }, { "step": 4495, "loss": 0.4441070258617401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.443718" }, { "step": 4496, "loss": 0.6232788562774658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.531080" }, { "step": 4497, "loss": 0.453496515750885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.625314" }, { "step": 4498, "loss": 0.9410767555236816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.720288" }, { "step": 4499, "loss": 0.5489144325256348, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.806829" }, { "step": 4500, "loss": 0.700005054473877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:16.895362" }, { "step": 4501, "loss": 0.5993916988372803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:39.687347" }, { "step": 4502, "loss": 0.39819595217704773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:39.808137" }, { "step": 4503, "loss": 0.38894376158714294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:39.903287" }, { "step": 4504, "loss": 0.615291953086853, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:39.995903" }, { "step": 4505, "loss": 0.7054672241210938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.107903" }, { "step": 4506, "loss": 0.9594279527664185, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.198401" }, { "step": 4507, "loss": 0.5543255805969238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.297338" }, { "step": 4508, "loss": 0.3810095191001892, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.394406" }, { "step": 4509, "loss": 0.7616061568260193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.508598" }, { "step": 4510, "loss": 0.5127065181732178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.598637" }, { "step": 4511, "loss": 0.9454849362373352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.687254" }, { "step": 4512, "loss": 0.5246887803077698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.778546" }, { "step": 4513, "loss": 0.8988473415374756, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.888246" }, { "step": 4514, "loss": 0.8997325301170349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:40.977710" }, { "step": 4515, "loss": 0.5730422735214233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.076130" }, { "step": 4516, "loss": 0.7939547300338745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.160146" }, { "step": 4517, "loss": 0.7268772125244141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.246790" }, { "step": 4518, "loss": 0.7470512390136719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.367663" }, { "step": 4519, "loss": 0.5599604845046997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.460993" }, { "step": 4520, "loss": 0.9345430135726929, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.568802" }, { "step": 4521, "loss": 0.408156156539917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.654348" }, { "step": 4522, "loss": 0.7429453134536743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.745904" }, { "step": 4523, "loss": 0.6472257375717163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.837868" }, { "step": 4524, "loss": 0.4857312738895416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:41.934197" }, { "step": 4525, "loss": 0.3531578779220581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.031038" }, { "step": 4526, "loss": 0.5100153684616089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.123064" }, { "step": 4527, "loss": 0.598386287689209, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.214920" }, { "step": 4528, "loss": 0.5456607937812805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.307486" }, { "step": 4529, "loss": 0.81768399477005, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.403663" }, { "step": 4530, "loss": 0.3020312786102295, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.488660" }, { "step": 4531, "loss": 0.8466737866401672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.581326" }, { "step": 4532, "loss": 0.4739243984222412, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.668243" }, { "step": 4533, "loss": 0.5074892044067383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.760373" }, { "step": 4534, "loss": 0.6033821702003479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.879748" }, { "step": 4535, "loss": 0.48342788219451904, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:42.972490" }, { "step": 4536, "loss": 0.9171985387802124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.112234" }, { "step": 4537, "loss": 0.40471351146698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.199991" }, { "step": 4538, "loss": 0.5680427551269531, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.294237" }, { "step": 4539, "loss": 0.7492805123329163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.378849" }, { "step": 4540, "loss": 0.6051138639450073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.465182" }, { "step": 4541, "loss": 0.6289836764335632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.559032" }, { "step": 4542, "loss": 0.5879309773445129, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.649653" }, { "step": 4543, "loss": 0.39331454038619995, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.742712" }, { "step": 4544, "loss": 0.6128024458885193, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.855664" }, { "step": 4545, "loss": 0.9141513109207153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:43.941750" }, { "step": 4546, "loss": 0.8147004842758179, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.026798" }, { "step": 4547, "loss": 0.34723129868507385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.116400" }, { "step": 4548, "loss": 0.8143356442451477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.202480" }, { "step": 4549, "loss": 0.5862226486206055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.300147" }, { "step": 4550, "loss": 0.5010809898376465, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.386263" }, { "step": 4551, "loss": 0.680986225605011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.516416" }, { "step": 4552, "loss": 0.33785441517829895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.602550" }, { "step": 4553, "loss": 0.5071364641189575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.693941" }, { "step": 4554, "loss": 0.7099546790122986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.803592" }, { "step": 4555, "loss": 0.4107416570186615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.893457" }, { "step": 4556, "loss": 0.49583685398101807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:44.978377" }, { "step": 4557, "loss": 0.6561521887779236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.091142" }, { "step": 4558, "loss": 0.6133583784103394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.184946" }, { "step": 4559, "loss": 0.5261045694351196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.281204" }, { "step": 4560, "loss": 0.6264874935150146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.370563" }, { "step": 4561, "loss": 0.9169460535049438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.489330" }, { "step": 4562, "loss": 0.43673765659332275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.575355" }, { "step": 4563, "loss": 0.48179924488067627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.677384" }, { "step": 4564, "loss": 0.7624706029891968, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.782985" }, { "step": 4565, "loss": 0.3472733199596405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.879810" }, { "step": 4566, "loss": 1.0822088718414307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:45.991782" }, { "step": 4567, "loss": 0.6766489744186401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.099930" }, { "step": 4568, "loss": 0.7153181433677673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.190640" }, { "step": 4569, "loss": 0.6145076155662537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.289835" }, { "step": 4570, "loss": 0.6375904083251953, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.405389" }, { "step": 4571, "loss": 0.5546172261238098, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.494868" }, { "step": 4572, "loss": 0.3625958561897278, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.587154" }, { "step": 4573, "loss": 0.6289509534835815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.681802" }, { "step": 4574, "loss": 0.9007325172424316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.793775" }, { "step": 4575, "loss": 0.7736178636550903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.886988" }, { "step": 4576, "loss": 0.5381861925125122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:46.983902" }, { "step": 4577, "loss": 0.6518550515174866, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.069036" }, { "step": 4578, "loss": 0.7232439517974854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.163524" }, { "step": 4579, "loss": 0.5923999547958374, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.251687" }, { "step": 4580, "loss": 0.7761327028274536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.336344" }, { "step": 4581, "loss": 0.7214019298553467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.421761" }, { "step": 4582, "loss": 0.4854578375816345, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.513617" }, { "step": 4583, "loss": 0.6078163385391235, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.599796" }, { "step": 4584, "loss": 0.8780027627944946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.685856" }, { "step": 4585, "loss": 0.522311806678772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.774789" }, { "step": 4586, "loss": 0.6167858242988586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.863251" }, { "step": 4587, "loss": 0.47062671184539795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:47.955696" }, { "step": 4588, "loss": 0.8082189559936523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.044190" }, { "step": 4589, "loss": 0.6485718488693237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.133977" }, { "step": 4590, "loss": 0.8347097635269165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.248443" }, { "step": 4591, "loss": 0.8959800601005554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.387558" }, { "step": 4592, "loss": 0.8487670421600342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.473576" }, { "step": 4593, "loss": 0.7864790558815002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.597088" }, { "step": 4594, "loss": 0.670312762260437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.708327" }, { "step": 4595, "loss": 0.8714357614517212, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.794572" }, { "step": 4596, "loss": 0.874374270439148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.880551" }, { "step": 4597, "loss": 0.6780912280082703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:48.971992" }, { "step": 4598, "loss": 0.8213457465171814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.056909" }, { "step": 4599, "loss": 0.6422121524810791, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.155774" }, { "step": 4600, "loss": 0.6723579168319702, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.240529" }, { "step": 4601, "loss": 0.3911513686180115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.354691" }, { "step": 4602, "loss": 0.4875815510749817, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.457213" }, { "step": 4603, "loss": 0.5885405540466309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.549662" }, { "step": 4604, "loss": 0.7909751534461975, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.642310" }, { "step": 4605, "loss": 0.5386859178543091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.753115" }, { "step": 4606, "loss": 0.8262953758239746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.839271" }, { "step": 4607, "loss": 0.5821189284324646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:49.932461" }, { "step": 4608, "loss": 0.7232680320739746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.017990" }, { "step": 4609, "loss": 0.5865445137023926, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.115575" }, { "step": 4610, "loss": 0.4776439070701599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.200227" }, { "step": 4611, "loss": 0.8281660079956055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.318099" }, { "step": 4612, "loss": 0.4336768388748169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.410610" }, { "step": 4613, "loss": 0.7653867602348328, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.501934" }, { "step": 4614, "loss": 0.7590848803520203, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.602838" }, { "step": 4615, "loss": 0.43119895458221436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.695916" }, { "step": 4616, "loss": 0.7177728414535522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.786023" }, { "step": 4617, "loss": 0.9818204641342163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.895612" }, { "step": 4618, "loss": 0.622050404548645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:50.993313" }, { "step": 4619, "loss": 0.7484825253486633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.086735" }, { "step": 4620, "loss": 0.45480525493621826, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.201655" }, { "step": 4621, "loss": 0.6866896152496338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.316592" }, { "step": 4622, "loss": 0.7369660139083862, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.404832" }, { "step": 4623, "loss": 1.0068135261535645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.514067" }, { "step": 4624, "loss": 0.6209254860877991, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.599440" }, { "step": 4625, "loss": 0.5629585981369019, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.687552" }, { "step": 4626, "loss": 0.8993641138076782, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.774622" }, { "step": 4627, "loss": 0.7293583154678345, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.861427" }, { "step": 4628, "loss": 0.36740970611572266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:51.949475" }, { "step": 4629, "loss": 0.6025190353393555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.034842" }, { "step": 4630, "loss": 0.6698351502418518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.127430" }, { "step": 4631, "loss": 0.6301352381706238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.214838" }, { "step": 4632, "loss": 0.6522918343544006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.300623" }, { "step": 4633, "loss": 0.4751187562942505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.393898" }, { "step": 4634, "loss": 0.6519132256507874, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.489089" }, { "step": 4635, "loss": 0.7766544818878174, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.575254" }, { "step": 4636, "loss": 0.6021887063980103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.686472" }, { "step": 4637, "loss": 0.8416724801063538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.781269" }, { "step": 4638, "loss": 0.5232183933258057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.876229" }, { "step": 4639, "loss": 1.0272201299667358, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:52.969923" }, { "step": 4640, "loss": 0.7609634399414062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.056908" }, { "step": 4641, "loss": 0.4089134931564331, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.153672" }, { "step": 4642, "loss": 0.7818801403045654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.261164" }, { "step": 4643, "loss": 0.8683321475982666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.349697" }, { "step": 4644, "loss": 0.467867910861969, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.435527" }, { "step": 4645, "loss": 0.8378889560699463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.520155" }, { "step": 4646, "loss": 0.7982330918312073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.636300" }, { "step": 4647, "loss": 0.7177354097366333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.728534" }, { "step": 4648, "loss": 0.4876829981803894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.823051" }, { "step": 4649, "loss": 0.5694680213928223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:53.915678" }, { "step": 4650, "loss": 0.7336537837982178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.002124" }, { "step": 4651, "loss": 0.45213913917541504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.089070" }, { "step": 4652, "loss": 0.4774692952632904, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.182272" }, { "step": 4653, "loss": 1.0784876346588135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.266988" }, { "step": 4654, "loss": 0.6361704468727112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.381196" }, { "step": 4655, "loss": 0.5737269520759583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.468051" }, { "step": 4656, "loss": 0.7246129512786865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.562525" }, { "step": 4657, "loss": 0.5183422565460205, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.662248" }, { "step": 4658, "loss": 0.3975881338119507, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.756770" }, { "step": 4659, "loss": 0.5858864784240723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.875120" }, { "step": 4660, "loss": 0.6289893388748169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:54.961608" }, { "step": 4661, "loss": 0.6600990295410156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.053109" }, { "step": 4662, "loss": 0.38084447383880615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.145360" }, { "step": 4663, "loss": 0.5261474847793579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.231648" }, { "step": 4664, "loss": 0.3622162938117981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.353495" }, { "step": 4665, "loss": 0.6055880784988403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.447918" }, { "step": 4666, "loss": 0.41879063844680786, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.536852" }, { "step": 4667, "loss": 0.4913090467453003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.623650" }, { "step": 4668, "loss": 0.5396468043327332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.740411" }, { "step": 4669, "loss": 0.733421802520752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.859943" }, { "step": 4670, "loss": 0.5591832399368286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:55.944794" }, { "step": 4671, "loss": 0.6260520815849304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.042197" }, { "step": 4672, "loss": 0.8667356371879578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.154404" }, { "step": 4673, "loss": 1.0128848552703857, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.246688" }, { "step": 4674, "loss": 0.8337464332580566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.336312" }, { "step": 4675, "loss": 0.42239370942115784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.421938" }, { "step": 4676, "loss": 0.6444863080978394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.514328" }, { "step": 4677, "loss": 0.5784633755683899, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.626207" }, { "step": 4678, "loss": 0.7047000527381897, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.722066" }, { "step": 4679, "loss": 0.594609260559082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.804406" }, { "step": 4680, "loss": 0.5911743640899658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.894055" }, { "step": 4681, "loss": 0.46164828538894653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:56.989374" }, { "step": 4682, "loss": 0.6354186534881592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.078466" }, { "step": 4683, "loss": 0.5399905443191528, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.169206" }, { "step": 4684, "loss": 0.5106227397918701, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.290192" }, { "step": 4685, "loss": 0.8128166794776917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.381906" }, { "step": 4686, "loss": 0.6065137386322021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.468339" }, { "step": 4687, "loss": 0.7846897840499878, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.557790" }, { "step": 4688, "loss": 0.4804084002971649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.650409" }, { "step": 4689, "loss": 0.5983918905258179, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.737812" }, { "step": 4690, "loss": 0.8099642992019653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.823307" }, { "step": 4691, "loss": 0.5829170346260071, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.912527" }, { "step": 4692, "loss": 0.7212488651275635, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:57.999400" }, { "step": 4693, "loss": 0.6834396123886108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.091207" }, { "step": 4694, "loss": 0.6368234157562256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.175995" }, { "step": 4695, "loss": 0.8630056381225586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.287893" }, { "step": 4696, "loss": 0.39391112327575684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.383409" }, { "step": 4697, "loss": 0.59542316198349, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.469326" }, { "step": 4698, "loss": 0.5083194971084595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.557847" }, { "step": 4699, "loss": 0.7129775285720825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.646703" }, { "step": 4700, "loss": 0.6734091639518738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.769649" }, { "step": 4701, "loss": 0.5988492369651794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.861137" }, { "step": 4702, "loss": 1.398263692855835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:58.947534" }, { "step": 4703, "loss": 0.45861923694610596, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.035052" }, { "step": 4704, "loss": 0.6044206619262695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.119592" }, { "step": 4705, "loss": 0.9830602407455444, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.216408" }, { "step": 4706, "loss": 0.45198383927345276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.303423" }, { "step": 4707, "loss": 0.5290166735649109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.390443" }, { "step": 4708, "loss": 0.5029173493385315, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.484470" }, { "step": 4709, "loss": 0.5283526182174683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.570363" }, { "step": 4710, "loss": 0.3786487281322479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.657982" }, { "step": 4711, "loss": 0.5871321558952332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.743128" }, { "step": 4712, "loss": 0.6651433110237122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.837103" }, { "step": 4713, "loss": 0.26556432247161865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:33:59.923057" }, { "step": 4714, "loss": 0.5890644192695618, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.013526" }, { "step": 4715, "loss": 0.38922321796417236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.098777" }, { "step": 4716, "loss": 0.9759541153907776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.207935" }, { "step": 4717, "loss": 0.49884796142578125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.294035" }, { "step": 4718, "loss": 0.9632370471954346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.379590" }, { "step": 4719, "loss": 0.6150012016296387, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.484453" }, { "step": 4720, "loss": 0.8039739727973938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.569820" }, { "step": 4721, "loss": 0.8927119374275208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.655077" }, { "step": 4722, "loss": 0.6912765502929688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.772965" }, { "step": 4723, "loss": 0.5740548968315125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.863221" }, { "step": 4724, "loss": 0.5822540521621704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:00.978307" }, { "step": 4725, "loss": 0.7010749578475952, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.063478" }, { "step": 4726, "loss": 0.49047204852104187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.155483" }, { "step": 4727, "loss": 0.8179123401641846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.265048" }, { "step": 4728, "loss": 0.3040582239627838, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.364256" }, { "step": 4729, "loss": 0.4686351418495178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.474363" }, { "step": 4730, "loss": 0.7630886435508728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.564379" }, { "step": 4731, "loss": 0.7592250108718872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.658464" }, { "step": 4732, "loss": 0.6979917883872986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.768891" }, { "step": 4733, "loss": 0.5066667795181274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.853649" }, { "step": 4734, "loss": 0.5406472086906433, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:01.961243" }, { "step": 4735, "loss": 0.6177148818969727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.057224" }, { "step": 4736, "loss": 0.6035199165344238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.142777" }, { "step": 4737, "loss": 0.4974743127822876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.234910" }, { "step": 4738, "loss": 0.4990059733390808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.320899" }, { "step": 4739, "loss": 0.8198952078819275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.439321" }, { "step": 4740, "loss": 0.7343868017196655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.523809" }, { "step": 4741, "loss": 0.6389904618263245, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.619836" }, { "step": 4742, "loss": 0.718293309211731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.730616" }, { "step": 4743, "loss": 0.7258696556091309, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.817943" }, { "step": 4744, "loss": 0.9373030662536621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.903220" }, { "step": 4745, "loss": 0.466278612613678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:02.987424" }, { "step": 4746, "loss": 0.569675862789154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.076915" }, { "step": 4747, "loss": 0.6560466289520264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.164375" }, { "step": 4748, "loss": 0.8675031661987305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.285933" }, { "step": 4749, "loss": 0.47471433877944946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.384219" }, { "step": 4750, "loss": 0.42209526896476746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.470074" }, { "step": 4751, "loss": 0.40512633323669434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.594185" }, { "step": 4752, "loss": 0.5865883827209473, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.680064" }, { "step": 4753, "loss": 0.8149303793907166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.775516" }, { "step": 4754, "loss": 0.6326409578323364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.861220" }, { "step": 4755, "loss": 0.6459879875183105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:03.953963" }, { "step": 4756, "loss": 0.987429678440094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.047129" }, { "step": 4757, "loss": 0.6699205636978149, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.158381" }, { "step": 4758, "loss": 0.8128054141998291, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.251830" }, { "step": 4759, "loss": 0.5322607755661011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.363650" }, { "step": 4760, "loss": 0.5706865787506104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.451779" }, { "step": 4761, "loss": 0.6876170635223389, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.543948" }, { "step": 4762, "loss": 0.5604346990585327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.633944" }, { "step": 4763, "loss": 0.44223660230636597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.730989" }, { "step": 4764, "loss": 0.6998351216316223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.848500" }, { "step": 4765, "loss": 0.25963568687438965, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:04.940388" }, { "step": 4766, "loss": 0.6101844310760498, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.026184" }, { "step": 4767, "loss": 0.6832072734832764, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.143026" }, { "step": 4768, "loss": 0.9513390064239502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.230419" }, { "step": 4769, "loss": 0.37626779079437256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.322300" }, { "step": 4770, "loss": 0.7185952663421631, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.413764" }, { "step": 4771, "loss": 0.5147793889045715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.498876" }, { "step": 4772, "loss": 0.6524436473846436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.587009" }, { "step": 4773, "loss": 0.5091190934181213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.680389" }, { "step": 4774, "loss": 0.7782458662986755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.767012" }, { "step": 4775, "loss": 0.47473257780075073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.853937" }, { "step": 4776, "loss": 0.27372628450393677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:05.943213" }, { "step": 4777, "loss": 0.637036919593811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.028211" }, { "step": 4778, "loss": 0.6784029006958008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.119976" }, { "step": 4779, "loss": 0.5661840438842773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.240666" }, { "step": 4780, "loss": 0.45196110010147095, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.326199" }, { "step": 4781, "loss": 1.00118088722229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.422679" }, { "step": 4782, "loss": 0.7859467267990112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.546654" }, { "step": 4783, "loss": 0.9852415323257446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.651479" }, { "step": 4784, "loss": 0.5347015857696533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.737997" }, { "step": 4785, "loss": 0.6668683290481567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.846516" }, { "step": 4786, "loss": 0.8139182329177856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:06.958381" }, { "step": 4787, "loss": 0.6357852220535278, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.073476" }, { "step": 4788, "loss": 0.9373699426651001, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.183841" }, { "step": 4789, "loss": 0.636122465133667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.275237" }, { "step": 4790, "loss": 1.0187816619873047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.393588" }, { "step": 4791, "loss": 0.9263008832931519, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.502651" }, { "step": 4792, "loss": 0.6031620502471924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.589915" }, { "step": 4793, "loss": 0.7280694842338562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.696928" }, { "step": 4794, "loss": 0.49572837352752686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.790169" }, { "step": 4795, "loss": 0.5959998369216919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.880342" }, { "step": 4796, "loss": 0.7016143202781677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:07.993603" }, { "step": 4797, "loss": 0.9361352324485779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.118755" }, { "step": 4798, "loss": 0.5767486691474915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.219227" }, { "step": 4799, "loss": 0.8335438370704651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.334271" }, { "step": 4800, "loss": 0.73659747838974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.446216" }, { "step": 4801, "loss": 0.8759230375289917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.544992" }, { "step": 4802, "loss": 0.5963420271873474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.630001" }, { "step": 4803, "loss": 0.40294718742370605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.717959" }, { "step": 4804, "loss": 0.6518760919570923, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.807485" }, { "step": 4805, "loss": 0.43018001317977905, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.899999" }, { "step": 4806, "loss": 0.6095156073570251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:08.983182" }, { "step": 4807, "loss": 0.5468474626541138, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.075780" }, { "step": 4808, "loss": 0.8386721611022949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.159892" }, { "step": 4809, "loss": 0.8641980886459351, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.284016" }, { "step": 4810, "loss": 0.8894654512405396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.379847" }, { "step": 4811, "loss": 0.7083070278167725, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.467567" }, { "step": 4812, "loss": 0.5538305640220642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.553791" }, { "step": 4813, "loss": 0.28800705075263977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.638904" }, { "step": 4814, "loss": 0.9083583354949951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.723784" }, { "step": 4815, "loss": 0.6762903928756714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.813107" }, { "step": 4816, "loss": 0.4568333625793457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.912996" }, { "step": 4817, "loss": 0.9642212390899658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:09.999063" }, { "step": 4818, "loss": 0.8917081356048584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.121850" }, { "step": 4819, "loss": 0.8120609521865845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.209501" }, { "step": 4820, "loss": 0.7568103075027466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.325201" }, { "step": 4821, "loss": 0.5471818447113037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.409701" }, { "step": 4822, "loss": 0.7567867040634155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.495842" }, { "step": 4823, "loss": 0.6620160341262817, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.616980" }, { "step": 4824, "loss": 0.7521164417266846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.729308" }, { "step": 4825, "loss": 0.8846526741981506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.842816" }, { "step": 4826, "loss": 0.7034571170806885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:10.935545" }, { "step": 4827, "loss": 0.7673000693321228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.020810" }, { "step": 4828, "loss": 0.3264208734035492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.116541" }, { "step": 4829, "loss": 0.8601971864700317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.247204" }, { "step": 4830, "loss": 0.40322256088256836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.343232" }, { "step": 4831, "loss": 1.0025851726531982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.434486" }, { "step": 4832, "loss": 0.786175549030304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.527140" }, { "step": 4833, "loss": 0.771054208278656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.615020" }, { "step": 4834, "loss": 0.38203439116477966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.701390" }, { "step": 4835, "loss": 0.8172411918640137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.794041" }, { "step": 4836, "loss": 0.4159138798713684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.879021" }, { "step": 4837, "loss": 1.171483039855957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:11.970327" }, { "step": 4838, "loss": 0.8218741416931152, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.056644" }, { "step": 4839, "loss": 0.49849817156791687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.148902" }, { "step": 4840, "loss": 0.7536492347717285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.286716" }, { "step": 4841, "loss": 0.7096771597862244, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.376592" }, { "step": 4842, "loss": 0.6603878736495972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.469650" }, { "step": 4843, "loss": 0.588475227355957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.557612" }, { "step": 4844, "loss": 0.6624993085861206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.643227" }, { "step": 4845, "loss": 0.5585310459136963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.735548" }, { "step": 4846, "loss": 0.6932848691940308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.824743" }, { "step": 4847, "loss": 0.6904866099357605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:12.918514" }, { "step": 4848, "loss": 0.5097074508666992, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.007615" }, { "step": 4849, "loss": 0.48242777585983276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.106525" }, { "step": 4850, "loss": 0.8165359497070312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.196488" }, { "step": 4851, "loss": 0.9573872089385986, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.288368" }, { "step": 4852, "loss": 0.49265798926353455, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.380354" }, { "step": 4853, "loss": 0.5577799677848816, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.484057" }, { "step": 4854, "loss": 0.8403815031051636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.570177" }, { "step": 4855, "loss": 0.27713343501091003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.660005" }, { "step": 4856, "loss": 0.9847837686538696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.780800" }, { "step": 4857, "loss": 0.554195761680603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.871525" }, { "step": 4858, "loss": 0.7247843742370605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:13.966068" }, { "step": 4859, "loss": 0.5249608159065247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.213232" }, { "step": 4860, "loss": 0.5424925088882446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.307878" }, { "step": 4861, "loss": 0.8913729786872864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.427651" }, { "step": 4862, "loss": 0.9263691902160645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.519343" }, { "step": 4863, "loss": 0.9089317321777344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.604117" }, { "step": 4864, "loss": 0.6810064315795898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.718296" }, { "step": 4865, "loss": 0.8960052728652954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.810881" }, { "step": 4866, "loss": 0.6618267893791199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.896349" }, { "step": 4867, "loss": 0.5342263579368591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:14.988480" }, { "step": 4868, "loss": 0.41671204566955566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.082110" }, { "step": 4869, "loss": 0.38900184631347656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.167793" }, { "step": 4870, "loss": 0.5313588380813599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.259370" }, { "step": 4871, "loss": 0.6123418211936951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.344530" }, { "step": 4872, "loss": 0.6907559037208557, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.432675" }, { "step": 4873, "loss": 0.585949182510376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.527062" }, { "step": 4874, "loss": 0.6403979659080505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.611614" }, { "step": 4875, "loss": 0.38878658413887024, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.698638" }, { "step": 4876, "loss": 0.5150213241577148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.791815" }, { "step": 4877, "loss": 0.6308550238609314, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:15.909599" }, { "step": 4878, "loss": 0.9061298370361328, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.023003" }, { "step": 4879, "loss": 0.896905779838562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.117648" }, { "step": 4880, "loss": 0.5401101112365723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.219032" }, { "step": 4881, "loss": 0.9314677119255066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.304044" }, { "step": 4882, "loss": 0.3855844736099243, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.398136" }, { "step": 4883, "loss": 0.5918634533882141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.490286" }, { "step": 4884, "loss": 0.331856369972229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.586356" }, { "step": 4885, "loss": 0.8515456318855286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.672314" }, { "step": 4886, "loss": 0.6489855051040649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.763854" }, { "step": 4887, "loss": 0.42113178968429565, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.856115" }, { "step": 4888, "loss": 0.6555677056312561, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:16.966110" }, { "step": 4889, "loss": 0.5628352761268616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.057944" }, { "step": 4890, "loss": 0.4291691780090332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.151823" }, { "step": 4891, "loss": 0.5312947034835815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.274801" }, { "step": 4892, "loss": 0.4670565128326416, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.363112" }, { "step": 4893, "loss": 0.6511622667312622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.449020" }, { "step": 4894, "loss": 0.7455966472625732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.535593" }, { "step": 4895, "loss": 0.701849102973938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.654201" }, { "step": 4896, "loss": 0.446536123752594, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.739476" }, { "step": 4897, "loss": 0.8681905269622803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.856552" }, { "step": 4898, "loss": 0.7346495389938354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:17.948227" }, { "step": 4899, "loss": 0.5020308494567871, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.045829" }, { "step": 4900, "loss": 0.5536429286003113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.163776" }, { "step": 4901, "loss": 0.5008077025413513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.256285" }, { "step": 4902, "loss": 0.7578904628753662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.343031" }, { "step": 4903, "loss": 1.0312392711639404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.432072" }, { "step": 4904, "loss": 0.7820578813552856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.542352" }, { "step": 4905, "loss": 0.335417777299881, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.628159" }, { "step": 4906, "loss": 0.6276026964187622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.714577" }, { "step": 4907, "loss": 0.520710289478302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.800397" }, { "step": 4908, "loss": 0.5678018927574158, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.895248" }, { "step": 4909, "loss": 0.2430700957775116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:18.986986" }, { "step": 4910, "loss": 0.38610124588012695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.087019" }, { "step": 4911, "loss": 0.6927369236946106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.175253" }, { "step": 4912, "loss": 0.8530865907669067, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.304602" }, { "step": 4913, "loss": 0.8604004979133606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.392004" }, { "step": 4914, "loss": 0.4708212912082672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.483504" }, { "step": 4915, "loss": 0.456662654876709, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.568295" }, { "step": 4916, "loss": 0.8033172488212585, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.681969" }, { "step": 4917, "loss": 0.784442126750946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.769560" }, { "step": 4918, "loss": 0.7484562993049622, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.862659" }, { "step": 4919, "loss": 0.567510724067688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:19.948919" }, { "step": 4920, "loss": 0.8703858852386475, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.048474" }, { "step": 4921, "loss": 0.7015682458877563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.160455" }, { "step": 4922, "loss": 0.5963343381881714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.245833" }, { "step": 4923, "loss": 0.6670812964439392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.331145" }, { "step": 4924, "loss": 0.5081415176391602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.419293" }, { "step": 4925, "loss": 0.6025235056877136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.512485" }, { "step": 4926, "loss": 0.7574318647384644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.604858" }, { "step": 4927, "loss": 0.7179967761039734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.699178" }, { "step": 4928, "loss": 0.5969555974006653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.784982" }, { "step": 4929, "loss": 0.8188075423240662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.871721" }, { "step": 4930, "loss": 0.7485949397087097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:20.982765" }, { "step": 4931, "loss": 0.6700524091720581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.079336" }, { "step": 4932, "loss": 0.7437383532524109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.176168" }, { "step": 4933, "loss": 0.6609228849411011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.268099" }, { "step": 4934, "loss": 0.36770519614219666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.354055" }, { "step": 4935, "loss": 0.609947919845581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.443878" }, { "step": 4936, "loss": 1.1691408157348633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.534799" }, { "step": 4937, "loss": 0.536351203918457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.622783" }, { "step": 4938, "loss": 0.4919799566268921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.717118" }, { "step": 4939, "loss": 0.6525318026542664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.834869" }, { "step": 4940, "loss": 0.9116221070289612, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:21.921438" }, { "step": 4941, "loss": 0.5798147320747375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.020810" }, { "step": 4942, "loss": 0.38772648572921753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.112722" }, { "step": 4943, "loss": 0.5781566500663757, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.206343" }, { "step": 4944, "loss": 0.9217891693115234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.307044" }, { "step": 4945, "loss": 0.57133948802948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.392802" }, { "step": 4946, "loss": 0.43550583720207214, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.485384" }, { "step": 4947, "loss": 0.6302466988563538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.597114" }, { "step": 4948, "loss": 0.7085608839988708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.690263" }, { "step": 4949, "loss": 0.6869469881057739, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.800140" }, { "step": 4950, "loss": 0.291115939617157, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.885216" }, { "step": 4951, "loss": 0.6595891714096069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:22.974092" }, { "step": 4952, "loss": 0.9027265310287476, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.060237" }, { "step": 4953, "loss": 0.5739670395851135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.171955" }, { "step": 4954, "loss": 0.8412516117095947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.282565" }, { "step": 4955, "loss": 0.7217704057693481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.380021" }, { "step": 4956, "loss": 0.5386013388633728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.479664" }, { "step": 4957, "loss": 0.7821775078773499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.565029" }, { "step": 4958, "loss": 0.9377442598342896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.664512" }, { "step": 4959, "loss": 0.6174846887588501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.755153" }, { "step": 4960, "loss": 0.6941519975662231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.847981" }, { "step": 4961, "loss": 0.6575572490692139, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:23.940019" }, { "step": 4962, "loss": 0.5592985153198242, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.033280" }, { "step": 4963, "loss": 0.7168711423873901, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.150344" }, { "step": 4964, "loss": 0.8011460304260254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.276724" }, { "step": 4965, "loss": 0.6063806414604187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.362671" }, { "step": 4966, "loss": 0.5544193387031555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.459817" }, { "step": 4967, "loss": 0.45808085799217224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.578507" }, { "step": 4968, "loss": 0.43647533655166626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.666455" }, { "step": 4969, "loss": 0.7745290398597717, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.806257" }, { "step": 4970, "loss": 0.33707159757614136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.901429" }, { "step": 4971, "loss": 0.9802877902984619, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:24.987339" }, { "step": 4972, "loss": 0.6557285785675049, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.098417" }, { "step": 4973, "loss": 0.9379945993423462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.185669" }, { "step": 4974, "loss": 0.644012451171875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.285889" }, { "step": 4975, "loss": 0.9863481521606445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.373428" }, { "step": 4976, "loss": 0.6722589731216431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.484943" }, { "step": 4977, "loss": 0.6633001565933228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.577060" }, { "step": 4978, "loss": 0.5961211919784546, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.675635" }, { "step": 4979, "loss": 0.4355506896972656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.761347" }, { "step": 4980, "loss": 0.616279661655426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.847180" }, { "step": 4981, "loss": 0.5660017728805542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:25.945868" }, { "step": 4982, "loss": 0.5722951292991638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.038611" }, { "step": 4983, "loss": 0.42637893557548523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.131786" }, { "step": 4984, "loss": 0.7918707132339478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.242879" }, { "step": 4985, "loss": 0.5162423849105835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.344844" }, { "step": 4986, "loss": 0.7594586610794067, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.462099" }, { "step": 4987, "loss": 0.7138240933418274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.546970" }, { "step": 4988, "loss": 0.4559468626976013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.630791" }, { "step": 4989, "loss": 0.4496631622314453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.715811" }, { "step": 4990, "loss": 0.4807143807411194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.810491" }, { "step": 4991, "loss": 0.5464977622032166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.896739" }, { "step": 4992, "loss": 0.5469595789909363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:26.992788" }, { "step": 4993, "loss": 0.6547837257385254, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.080179" }, { "step": 4994, "loss": 0.8258038759231567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.189994" }, { "step": 4995, "loss": 0.873200535774231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.301407" }, { "step": 4996, "loss": 0.7649094462394714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.390785" }, { "step": 4997, "loss": 0.414519727230072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.478924" }, { "step": 4998, "loss": 0.43495920300483704, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.571981" }, { "step": 4999, "loss": 1.0806643962860107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.681876" }, { "step": 5000, "loss": 0.42081236839294434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:27.775635" }, { "step": 5001, "loss": 0.5951192378997803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:50.595738" }, { "step": 5002, "loss": 0.7323955297470093, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:50.683386" }, { "step": 5003, "loss": 0.5825838446617126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:50.774630" }, { "step": 5004, "loss": 0.7656702995300293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:50.860716" }, { "step": 5005, "loss": 0.8869602680206299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:50.973508" }, { "step": 5006, "loss": 0.7153304815292358, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.066256" }, { "step": 5007, "loss": 0.708906888961792, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.205144" }, { "step": 5008, "loss": 0.6133823990821838, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.298245" }, { "step": 5009, "loss": 0.373102605342865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.390001" }, { "step": 5010, "loss": 0.48624324798583984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.477827" }, { "step": 5011, "loss": 0.7198675870895386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.563799" }, { "step": 5012, "loss": 0.6103211045265198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.650784" }, { "step": 5013, "loss": 0.5076425671577454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.739432" }, { "step": 5014, "loss": 0.4693804383277893, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.824882" }, { "step": 5015, "loss": 0.8187416791915894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.913059" }, { "step": 5016, "loss": 0.45944374799728394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:51.999498" }, { "step": 5017, "loss": 0.3259526789188385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.089647" }, { "step": 5018, "loss": 0.5893322229385376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.181214" }, { "step": 5019, "loss": 0.4903576374053955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.273656" }, { "step": 5020, "loss": 0.6866074800491333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.365559" }, { "step": 5021, "loss": 1.0188701152801514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.490066" }, { "step": 5022, "loss": 0.753882646560669, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.574544" }, { "step": 5023, "loss": 0.5718822479248047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.660234" }, { "step": 5024, "loss": 0.6901964545249939, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.747089" }, { "step": 5025, "loss": 0.644472599029541, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.840719" }, { "step": 5026, "loss": 0.6688041687011719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:52.929470" }, { "step": 5027, "loss": 0.7976592779159546, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.014092" }, { "step": 5028, "loss": 0.5451935529708862, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.132157" }, { "step": 5029, "loss": 0.7038506865501404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.223259" }, { "step": 5030, "loss": 0.4473263621330261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.324190" }, { "step": 5031, "loss": 0.7480633854866028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.411251" }, { "step": 5032, "loss": 0.4362540543079376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.507553" }, { "step": 5033, "loss": 0.8380954265594482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.595760" }, { "step": 5034, "loss": 0.8034522533416748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.688490" }, { "step": 5035, "loss": 0.7110193967819214, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.782096" }, { "step": 5036, "loss": 0.8219634294509888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.893459" }, { "step": 5037, "loss": 0.5457364320755005, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:53.979404" }, { "step": 5038, "loss": 0.3781213164329529, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.071549" }, { "step": 5039, "loss": 0.7167928218841553, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.163458" }, { "step": 5040, "loss": 0.601212203502655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.255210" }, { "step": 5041, "loss": 0.6509326100349426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.372773" }, { "step": 5042, "loss": 0.6906476020812988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.460073" }, { "step": 5043, "loss": 0.5912879705429077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.554573" }, { "step": 5044, "loss": 0.25324422121047974, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.639225" }, { "step": 5045, "loss": 0.7913423776626587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.741525" }, { "step": 5046, "loss": 0.5433337092399597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.832891" }, { "step": 5047, "loss": 0.4321343004703522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:54.919485" }, { "step": 5048, "loss": 0.69386225938797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.013195" }, { "step": 5049, "loss": 1.1141939163208008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.098540" }, { "step": 5050, "loss": 0.7368372678756714, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.196835" }, { "step": 5051, "loss": 0.6763082146644592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.284257" }, { "step": 5052, "loss": 0.4290677309036255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.379919" }, { "step": 5053, "loss": 0.7288506031036377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.463950" }, { "step": 5054, "loss": 0.5851567387580872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.559978" }, { "step": 5055, "loss": 0.5925192832946777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.668552" }, { "step": 5056, "loss": 0.8306054472923279, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.753791" }, { "step": 5057, "loss": 0.5277031064033508, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.848062" }, { "step": 5058, "loss": 0.46012288331985474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:55.946637" }, { "step": 5059, "loss": 0.3008827269077301, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.039477" }, { "step": 5060, "loss": 0.37144941091537476, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.129714" }, { "step": 5061, "loss": 0.3130144476890564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.215936" }, { "step": 5062, "loss": 0.5671985149383545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.327428" }, { "step": 5063, "loss": 0.3816457688808441, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.420498" }, { "step": 5064, "loss": 0.24656365811824799, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.505722" }, { "step": 5065, "loss": 1.0002244710922241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.594419" }, { "step": 5066, "loss": 0.5860727429389954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.697563" }, { "step": 5067, "loss": 1.0522124767303467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.781384" }, { "step": 5068, "loss": 0.4651108980178833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.866459" }, { "step": 5069, "loss": 0.6630339622497559, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:56.959692" }, { "step": 5070, "loss": 0.6970082521438599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.053166" }, { "step": 5071, "loss": 0.73664391040802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.172216" }, { "step": 5072, "loss": 0.7130076885223389, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.282447" }, { "step": 5073, "loss": 0.6061368584632874, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.371298" }, { "step": 5074, "loss": 0.4522831439971924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.471732" }, { "step": 5075, "loss": 0.7514994740486145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.593432" }, { "step": 5076, "loss": 0.6949359774589539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.680693" }, { "step": 5077, "loss": 0.7874833345413208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.766217" }, { "step": 5078, "loss": 0.8882912993431091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.853960" }, { "step": 5079, "loss": 0.6357581615447998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:57.946422" }, { "step": 5080, "loss": 0.6458977460861206, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.061394" }, { "step": 5081, "loss": 0.8205579519271851, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.175601" }, { "step": 5082, "loss": 0.627174437046051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.278663" }, { "step": 5083, "loss": 0.5694891214370728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.392470" }, { "step": 5084, "loss": 0.5759196281433105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.503263" }, { "step": 5085, "loss": 0.9953820705413818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.634596" }, { "step": 5086, "loss": 0.6089091897010803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.745367" }, { "step": 5087, "loss": 0.6281538605690002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.830821" }, { "step": 5088, "loss": 0.5874292850494385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:58.932738" }, { "step": 5089, "loss": 0.6670938730239868, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.028838" }, { "step": 5090, "loss": 0.7170185446739197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.136615" }, { "step": 5091, "loss": 0.8619066476821899, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.259327" }, { "step": 5092, "loss": 0.5680777430534363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.354013" }, { "step": 5093, "loss": 0.9130675196647644, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.443155" }, { "step": 5094, "loss": 0.6569489240646362, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.532198" }, { "step": 5095, "loss": 0.5293777585029602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.627109" }, { "step": 5096, "loss": 0.8910971879959106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.765382" }, { "step": 5097, "loss": 0.509231448173523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.863162" }, { "step": 5098, "loss": 0.671502947807312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:34:59.948564" }, { "step": 5099, "loss": 0.6821962594985962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.042618" }, { "step": 5100, "loss": 0.8069772720336914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.160427" }, { "step": 5101, "loss": 0.7527914643287659, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.249950" }, { "step": 5102, "loss": 0.5380275845527649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.349804" }, { "step": 5103, "loss": 0.4806023836135864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.442903" }, { "step": 5104, "loss": 0.8489611148834229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.576637" }, { "step": 5105, "loss": 0.527658224105835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.670330" }, { "step": 5106, "loss": 0.656041145324707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.773094" }, { "step": 5107, "loss": 0.598253607749939, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.858878" }, { "step": 5108, "loss": 0.43985095620155334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:00.962562" }, { "step": 5109, "loss": 0.613104522228241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.064458" }, { "step": 5110, "loss": 0.46037226915359497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.155447" }, { "step": 5111, "loss": 0.6824519038200378, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.240412" }, { "step": 5112, "loss": 0.580655574798584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.339021" }, { "step": 5113, "loss": 0.7986278533935547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.464504" }, { "step": 5114, "loss": 0.6683560609817505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.582280" }, { "step": 5115, "loss": 0.5463663935661316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.668006" }, { "step": 5116, "loss": 0.6117937564849854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.754816" }, { "step": 5117, "loss": 0.5207106471061707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.875592" }, { "step": 5118, "loss": 0.7171536684036255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:01.982909" }, { "step": 5119, "loss": 0.5626745223999023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.068997" }, { "step": 5120, "loss": 0.7836592197418213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.169363" }, { "step": 5121, "loss": 0.5542454123497009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.255044" }, { "step": 5122, "loss": 0.4552422761917114, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.353997" }, { "step": 5123, "loss": 0.7540405988693237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.443461" }, { "step": 5124, "loss": 0.4855286478996277, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.538143" }, { "step": 5125, "loss": 1.1178793907165527, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.622587" }, { "step": 5126, "loss": 0.5279051065444946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.717832" }, { "step": 5127, "loss": 0.6171826124191284, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.807545" }, { "step": 5128, "loss": 0.8220392465591431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.895849" }, { "step": 5129, "loss": 0.6405854225158691, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:02.982986" }, { "step": 5130, "loss": 0.2996223270893097, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.069863" }, { "step": 5131, "loss": 0.6055275797843933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.174719" }, { "step": 5132, "loss": 0.6231158375740051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.264347" }, { "step": 5133, "loss": 0.6500022411346436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.354184" }, { "step": 5134, "loss": 0.5910510420799255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.454072" }, { "step": 5135, "loss": 0.7310243844985962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.540657" }, { "step": 5136, "loss": 0.9147123098373413, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.662615" }, { "step": 5137, "loss": 0.9139012098312378, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.774896" }, { "step": 5138, "loss": 0.47716617584228516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.871842" }, { "step": 5139, "loss": 0.6432809829711914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:03.964748" }, { "step": 5140, "loss": 0.8174035549163818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.054884" }, { "step": 5141, "loss": 0.7433757781982422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.151913" }, { "step": 5142, "loss": 0.6848788261413574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.250306" }, { "step": 5143, "loss": 0.5442079901695251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.336555" }, { "step": 5144, "loss": 0.43561917543411255, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.428856" }, { "step": 5145, "loss": 0.546186625957489, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.523114" }, { "step": 5146, "loss": 0.32851094007492065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.611587" }, { "step": 5147, "loss": 0.7564002275466919, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.697842" }, { "step": 5148, "loss": 0.533362865447998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.783182" }, { "step": 5149, "loss": 0.5637890696525574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.870080" }, { "step": 5150, "loss": 0.550150454044342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:04.972646" }, { "step": 5151, "loss": 0.6899356245994568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.071808" }, { "step": 5152, "loss": 0.6629383563995361, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.165738" }, { "step": 5153, "loss": 0.8489761352539062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.255766" }, { "step": 5154, "loss": 0.7000207901000977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.365739" }, { "step": 5155, "loss": 1.0517871379852295, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.452651" }, { "step": 5156, "loss": 0.7380095720291138, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.569462" }, { "step": 5157, "loss": 0.7424658536911011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.654490" }, { "step": 5158, "loss": 0.6614516973495483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.743419" }, { "step": 5159, "loss": 0.6801732778549194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.841936" }, { "step": 5160, "loss": 0.8160336017608643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:05.938662" }, { "step": 5161, "loss": 0.6250806450843811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.027512" }, { "step": 5162, "loss": 0.38111984729766846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.113517" }, { "step": 5163, "loss": 0.6185423731803894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.200537" }, { "step": 5164, "loss": 0.606499433517456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.316871" }, { "step": 5165, "loss": 0.28164032101631165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.411867" }, { "step": 5166, "loss": 0.5507909655570984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.505580" }, { "step": 5167, "loss": 0.7213277816772461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.622425" }, { "step": 5168, "loss": 0.6242302060127258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.707026" }, { "step": 5169, "loss": 0.8653358817100525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.792219" }, { "step": 5170, "loss": 0.8508985042572021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.885453" }, { "step": 5171, "loss": 0.5707094073295593, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:06.969768" }, { "step": 5172, "loss": 0.43748360872268677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.055600" }, { "step": 5173, "loss": 0.6067624092102051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.148717" }, { "step": 5174, "loss": 0.32766446471214294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.247712" }, { "step": 5175, "loss": 0.6946417689323425, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.333255" }, { "step": 5176, "loss": 0.46871596574783325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.419128" }, { "step": 5177, "loss": 0.33262407779693604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.510301" }, { "step": 5178, "loss": 0.763990044593811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.594551" }, { "step": 5179, "loss": 0.4958096146583557, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.687883" }, { "step": 5180, "loss": 0.7701265215873718, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.797151" }, { "step": 5181, "loss": 0.7508771419525146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.886666" }, { "step": 5182, "loss": 0.6959789395332336, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:07.973724" }, { "step": 5183, "loss": 0.5615055561065674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.068275" }, { "step": 5184, "loss": 0.44615817070007324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.153221" }, { "step": 5185, "loss": 0.7912470102310181, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.237585" }, { "step": 5186, "loss": 0.5567646622657776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.329018" }, { "step": 5187, "loss": 0.552714467048645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.429358" }, { "step": 5188, "loss": 0.9080017805099487, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.553213" }, { "step": 5189, "loss": 0.6858353614807129, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.640227" }, { "step": 5190, "loss": 0.6646381616592407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.753860" }, { "step": 5191, "loss": 0.6860795617103577, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.871807" }, { "step": 5192, "loss": 1.0018224716186523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:08.963645" }, { "step": 5193, "loss": 0.7621273398399353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.080305" }, { "step": 5194, "loss": 0.4891170263290405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.178481" }, { "step": 5195, "loss": 0.4607897400856018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.277495" }, { "step": 5196, "loss": 0.6500136852264404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.361516" }, { "step": 5197, "loss": 0.8147071599960327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.477006" }, { "step": 5198, "loss": 0.7508507966995239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.584679" }, { "step": 5199, "loss": 0.4836161732673645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.669990" }, { "step": 5200, "loss": 0.5416361093521118, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.756156" }, { "step": 5201, "loss": 0.6802971363067627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.847013" }, { "step": 5202, "loss": 0.7954579591751099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:09.956891" }, { "step": 5203, "loss": 0.5375075340270996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.051168" }, { "step": 5204, "loss": 0.43551167845726013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.144419" }, { "step": 5205, "loss": 0.45869180560112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.243700" }, { "step": 5206, "loss": 0.7711325883865356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.329250" }, { "step": 5207, "loss": 0.7653231620788574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.419668" }, { "step": 5208, "loss": 0.39428234100341797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.505359" }, { "step": 5209, "loss": 0.6600005626678467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.591017" }, { "step": 5210, "loss": 0.5370796322822571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.681887" }, { "step": 5211, "loss": 1.12953782081604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.771180" }, { "step": 5212, "loss": 0.6836779117584229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.857095" }, { "step": 5213, "loss": 0.6753286123275757, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:10.955230" }, { "step": 5214, "loss": 0.5806745886802673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.045759" }, { "step": 5215, "loss": 0.7765303254127502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.156795" }, { "step": 5216, "loss": 1.2855310440063477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.246058" }, { "step": 5217, "loss": 0.3974851965904236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.338461" }, { "step": 5218, "loss": 0.5212668180465698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.431632" }, { "step": 5219, "loss": 0.6381855010986328, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.522208" }, { "step": 5220, "loss": 0.5755220651626587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.621589" }, { "step": 5221, "loss": 0.5240416526794434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.707574" }, { "step": 5222, "loss": 0.39984965324401855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.793080" }, { "step": 5223, "loss": 0.4870592951774597, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:11.884507" }, { "step": 5224, "loss": 0.7420036792755127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.000803" }, { "step": 5225, "loss": 0.39653831720352173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.093363" }, { "step": 5226, "loss": 0.7941811084747314, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.185543" }, { "step": 5227, "loss": 0.68599534034729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.302762" }, { "step": 5228, "loss": 0.6420697569847107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.388574" }, { "step": 5229, "loss": 0.29388195276260376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.487418" }, { "step": 5230, "loss": 0.7698599696159363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.581960" }, { "step": 5231, "loss": 0.4296623468399048, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.671772" }, { "step": 5232, "loss": 0.8686885833740234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.759053" }, { "step": 5233, "loss": 0.8088715076446533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.845167" }, { "step": 5234, "loss": 0.6407808065414429, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:12.937364" }, { "step": 5235, "loss": 1.1243447065353394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.023975" }, { "step": 5236, "loss": 0.49466371536254883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.123132" }, { "step": 5237, "loss": 0.6473598480224609, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.247623" }, { "step": 5238, "loss": 0.8934952020645142, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.335968" }, { "step": 5239, "loss": 0.5833638906478882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.433568" }, { "step": 5240, "loss": 0.44140511751174927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.526273" }, { "step": 5241, "loss": 0.510111391544342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.610003" }, { "step": 5242, "loss": 0.8450664281845093, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.718436" }, { "step": 5243, "loss": 1.0136253833770752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.811677" }, { "step": 5244, "loss": 0.6410328149795532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.903586" }, { "step": 5245, "loss": 0.4767501950263977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:13.989282" }, { "step": 5246, "loss": 0.6667538285255432, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.079120" }, { "step": 5247, "loss": 0.4306851625442505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.163415" }, { "step": 5248, "loss": 0.9562978744506836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.257854" }, { "step": 5249, "loss": 0.8550502061843872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.342966" }, { "step": 5250, "loss": 0.6880485415458679, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.439323" }, { "step": 5251, "loss": 0.5612602829933167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.528940" }, { "step": 5252, "loss": 0.9827108383178711, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.617129" }, { "step": 5253, "loss": 0.4732167720794678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.701139" }, { "step": 5254, "loss": 0.6105453968048096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.789568" }, { "step": 5255, "loss": 0.5365049839019775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:14.909206" }, { "step": 5256, "loss": 0.41693925857543945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.003140" }, { "step": 5257, "loss": 0.801144003868103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.090360" }, { "step": 5258, "loss": 0.397297203540802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.184018" }, { "step": 5259, "loss": 0.7830079793930054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.273500" }, { "step": 5260, "loss": 0.5241480469703674, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.383383" }, { "step": 5261, "loss": 0.5170097947120667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.472807" }, { "step": 5262, "loss": 0.6923742890357971, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.566284" }, { "step": 5263, "loss": 0.42461681365966797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.656698" }, { "step": 5264, "loss": 0.5379315614700317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.750464" }, { "step": 5265, "loss": 0.5429901480674744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.863578" }, { "step": 5266, "loss": 0.6550177335739136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:15.951319" }, { "step": 5267, "loss": 0.5870937705039978, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.068535" }, { "step": 5268, "loss": 0.5703401565551758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.162386" }, { "step": 5269, "loss": 0.601983368396759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.248835" }, { "step": 5270, "loss": 0.8342890739440918, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.364992" }, { "step": 5271, "loss": 0.7161109447479248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.451113" }, { "step": 5272, "loss": 0.5550898909568787, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.542702" }, { "step": 5273, "loss": 0.7469043135643005, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.648621" }, { "step": 5274, "loss": 0.7208850383758545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.739706" }, { "step": 5275, "loss": 0.7569739818572998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.857212" }, { "step": 5276, "loss": 0.5927835702896118, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:16.955386" }, { "step": 5277, "loss": 0.5642762780189514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.075586" }, { "step": 5278, "loss": 0.47703346610069275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.164490" }, { "step": 5279, "loss": 0.5822703838348389, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.250981" }, { "step": 5280, "loss": 0.7320791482925415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.369627" }, { "step": 5281, "loss": 0.7296905517578125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.462088" }, { "step": 5282, "loss": 0.5532791614532471, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.552961" }, { "step": 5283, "loss": 0.6432331800460815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.662664" }, { "step": 5284, "loss": 0.5252206325531006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.749168" }, { "step": 5285, "loss": 0.7656639814376831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.833537" }, { "step": 5286, "loss": 1.0824252367019653, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:17.930358" }, { "step": 5287, "loss": 0.6591073274612427, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.016359" }, { "step": 5288, "loss": 0.8586819171905518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.108823" }, { "step": 5289, "loss": 0.6848097443580627, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.195646" }, { "step": 5290, "loss": 0.6834993362426758, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.282673" }, { "step": 5291, "loss": 0.6532515287399292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.375167" }, { "step": 5292, "loss": 0.4039452075958252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.473980" }, { "step": 5293, "loss": 0.48468711972236633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.558620" }, { "step": 5294, "loss": 1.1535964012145996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.697151" }, { "step": 5295, "loss": 0.6373159885406494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.794090" }, { "step": 5296, "loss": 0.49422046542167664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.879925" }, { "step": 5297, "loss": 0.9448153972625732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:18.974837" }, { "step": 5298, "loss": 0.7341314554214478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.091413" }, { "step": 5299, "loss": 0.7926164269447327, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.179545" }, { "step": 5300, "loss": 0.468866229057312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.272591" }, { "step": 5301, "loss": 0.5493701100349426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.358353" }, { "step": 5302, "loss": 0.6809881925582886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.452351" }, { "step": 5303, "loss": 0.7910479307174683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.574831" }, { "step": 5304, "loss": 0.9022915363311768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.717408" }, { "step": 5305, "loss": 0.9410111904144287, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.853673" }, { "step": 5306, "loss": 0.40125325322151184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:19.942214" }, { "step": 5307, "loss": 0.46764516830444336, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.034290" }, { "step": 5308, "loss": 0.630170464515686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.125220" }, { "step": 5309, "loss": 0.4460214376449585, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.211402" }, { "step": 5310, "loss": 1.1366885900497437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.297845" }, { "step": 5311, "loss": 0.730813205242157, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.387595" }, { "step": 5312, "loss": 0.7450922131538391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.500483" }, { "step": 5313, "loss": 0.5237643718719482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.596072" }, { "step": 5314, "loss": 0.4871298670768738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.687769" }, { "step": 5315, "loss": 0.7882100343704224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.777196" }, { "step": 5316, "loss": 0.8655515909194946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.863982" }, { "step": 5317, "loss": 0.39512526988983154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:20.965572" }, { "step": 5318, "loss": 0.5281268954277039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.092231" }, { "step": 5319, "loss": 0.5935298204421997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.177447" }, { "step": 5320, "loss": 0.7224054932594299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.264214" }, { "step": 5321, "loss": 0.6267576813697815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.348968" }, { "step": 5322, "loss": 0.661434531211853, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.468728" }, { "step": 5323, "loss": 0.6012091040611267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.565887" }, { "step": 5324, "loss": 0.9631133079528809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.650256" }, { "step": 5325, "loss": 0.6083294153213501, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.736717" }, { "step": 5326, "loss": 0.810582160949707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.829678" }, { "step": 5327, "loss": 0.7161573171615601, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:21.924774" }, { "step": 5328, "loss": 0.8574742078781128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.013463" }, { "step": 5329, "loss": 0.8996421098709106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.132542" }, { "step": 5330, "loss": 0.825309157371521, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.249563" }, { "step": 5331, "loss": 0.6450573205947876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.335858" }, { "step": 5332, "loss": 0.7526185512542725, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.426453" }, { "step": 5333, "loss": 0.6454386115074158, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.522225" }, { "step": 5334, "loss": 0.7778708934783936, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.608938" }, { "step": 5335, "loss": 0.7210675477981567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.701340" }, { "step": 5336, "loss": 0.6998779773712158, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.787466" }, { "step": 5337, "loss": 0.6219935417175293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.873023" }, { "step": 5338, "loss": 0.5134443044662476, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:22.965672" }, { "step": 5339, "loss": 1.031418800354004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.051076" }, { "step": 5340, "loss": 0.6048306226730347, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.136510" }, { "step": 5341, "loss": 0.40462344884872437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.224761" }, { "step": 5342, "loss": 0.8919198513031006, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.327215" }, { "step": 5343, "loss": 0.5340045690536499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.419967" }, { "step": 5344, "loss": 0.8810837268829346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.505599" }, { "step": 5345, "loss": 0.9676270484924316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.591291" }, { "step": 5346, "loss": 0.4701799154281616, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.677808" }, { "step": 5347, "loss": 0.9284703731536865, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.766150" }, { "step": 5348, "loss": 0.8560200929641724, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.878549" }, { "step": 5349, "loss": 0.7633235454559326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:23.981661" }, { "step": 5350, "loss": 0.553311824798584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.081600" }, { "step": 5351, "loss": 0.6665992140769958, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.181762" }, { "step": 5352, "loss": 0.3709503710269928, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.268322" }, { "step": 5353, "loss": 0.4934130311012268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.353698" }, { "step": 5354, "loss": 0.8157681226730347, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.446871" }, { "step": 5355, "loss": 0.5500645637512207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.565252" }, { "step": 5356, "loss": 0.763068437576294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.675117" }, { "step": 5357, "loss": 0.4543488621711731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.768618" }, { "step": 5358, "loss": 0.9308655858039856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.854413" }, { "step": 5359, "loss": 0.7274183034896851, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:24.968971" }, { "step": 5360, "loss": 0.7637754082679749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.053753" }, { "step": 5361, "loss": 0.6231275796890259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.145406" }, { "step": 5362, "loss": 0.6072465181350708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.233087" }, { "step": 5363, "loss": 1.1230602264404297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.344421" }, { "step": 5364, "loss": 0.7933127880096436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.455760" }, { "step": 5365, "loss": 1.1109681129455566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.546384" }, { "step": 5366, "loss": 0.9142438173294067, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.658073" }, { "step": 5367, "loss": 1.0180119276046753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.750620" }, { "step": 5368, "loss": 0.6398467421531677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.841189" }, { "step": 5369, "loss": 0.6533701419830322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:25.933480" }, { "step": 5370, "loss": 0.9727879762649536, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.024552" }, { "step": 5371, "loss": 0.6157466173171997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.116019" }, { "step": 5372, "loss": 0.5261214971542358, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.201004" }, { "step": 5373, "loss": 0.6708849668502808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.311214" }, { "step": 5374, "loss": 1.0225187540054321, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.423030" }, { "step": 5375, "loss": 0.6381993889808655, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.512560" }, { "step": 5376, "loss": 0.6903390884399414, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.599045" }, { "step": 5377, "loss": 0.8069884777069092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.718354" }, { "step": 5378, "loss": 0.7906883358955383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.834060" }, { "step": 5379, "loss": 0.9352955222129822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:26.943804" }, { "step": 5380, "loss": 0.6629771590232849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.028180" }, { "step": 5381, "loss": 0.6594962477684021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.128219" }, { "step": 5382, "loss": 0.3965241312980652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.223185" }, { "step": 5383, "loss": 0.7446549534797668, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.313366" }, { "step": 5384, "loss": 0.7740012407302856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.405370" }, { "step": 5385, "loss": 0.5420485734939575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.493411" }, { "step": 5386, "loss": 1.0841143131256104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.601138" }, { "step": 5387, "loss": 0.45963147282600403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.701858" }, { "step": 5388, "loss": 0.8962045907974243, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.794339" }, { "step": 5389, "loss": 0.9207224249839783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.905764" }, { "step": 5390, "loss": 0.451105535030365, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:27.992233" }, { "step": 5391, "loss": 0.6607620120048523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.082524" }, { "step": 5392, "loss": 0.5382044911384583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.183194" }, { "step": 5393, "loss": 0.5554115176200867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.274551" }, { "step": 5394, "loss": 0.8041130304336548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.365907" }, { "step": 5395, "loss": 0.9207351207733154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.453187" }, { "step": 5396, "loss": 0.8844605088233948, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.566189" }, { "step": 5397, "loss": 0.5394970178604126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.652545" }, { "step": 5398, "loss": 0.4043452739715576, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.747457" }, { "step": 5399, "loss": 0.3591093420982361, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.839471" }, { "step": 5400, "loss": 0.7817924618721008, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:28.957062" }, { "step": 5401, "loss": 0.7424918413162231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.074187" }, { "step": 5402, "loss": 0.9739941358566284, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.190569" }, { "step": 5403, "loss": 0.7140771150588989, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.277936" }, { "step": 5404, "loss": 0.9118127822875977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.371050" }, { "step": 5405, "loss": 0.5426833033561707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.466526" }, { "step": 5406, "loss": 0.8691698908805847, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.558300" }, { "step": 5407, "loss": 0.6660234928131104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.643470" }, { "step": 5408, "loss": 0.692325234413147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.754845" }, { "step": 5409, "loss": 0.619080662727356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.871965" }, { "step": 5410, "loss": 0.6115942597389221, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:29.960343" }, { "step": 5411, "loss": 0.6016713380813599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.074134" }, { "step": 5412, "loss": 0.5499423742294312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.159865" }, { "step": 5413, "loss": 0.30482161045074463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.247249" }, { "step": 5414, "loss": 0.5986266136169434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.356906" }, { "step": 5415, "loss": 0.41288888454437256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.448002" }, { "step": 5416, "loss": 0.9673306941986084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.560397" }, { "step": 5417, "loss": 0.5668858885765076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.652083" }, { "step": 5418, "loss": 0.5547785758972168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.748051" }, { "step": 5419, "loss": 1.048303246498108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.863329" }, { "step": 5420, "loss": 0.4744086265563965, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:30.949333" }, { "step": 5421, "loss": 0.3299217224121094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.043372" }, { "step": 5422, "loss": 0.5857633948326111, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.156803" }, { "step": 5423, "loss": 0.48149871826171875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.244739" }, { "step": 5424, "loss": 0.7493994832038879, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.330268" }, { "step": 5425, "loss": 0.8016736507415771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.447326" }, { "step": 5426, "loss": 0.7601327896118164, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.533910" }, { "step": 5427, "loss": 0.7173642516136169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.627634" }, { "step": 5428, "loss": 0.9883475303649902, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.720466" }, { "step": 5429, "loss": 0.5989494323730469, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.812695" }, { "step": 5430, "loss": 0.9615006446838379, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:31.925713" }, { "step": 5431, "loss": 0.7180347442626953, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.010877" }, { "step": 5432, "loss": 0.4803329408168793, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.097302" }, { "step": 5433, "loss": 0.712143063545227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.212822" }, { "step": 5434, "loss": 0.4673738181591034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.299577" }, { "step": 5435, "loss": 0.4736776351928711, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.393917" }, { "step": 5436, "loss": 0.5435335040092468, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.489222" }, { "step": 5437, "loss": 0.6186005473136902, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.575738" }, { "step": 5438, "loss": 0.3098321855068207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.663266" }, { "step": 5439, "loss": 0.9513657093048096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.749858" }, { "step": 5440, "loss": 0.4211292862892151, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.841024" }, { "step": 5441, "loss": 0.77137291431427, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:32.952409" }, { "step": 5442, "loss": 0.6504303812980652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.061131" }, { "step": 5443, "loss": 0.5651764273643494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.160396" }, { "step": 5444, "loss": 0.32058799266815186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.252437" }, { "step": 5445, "loss": 0.8330054879188538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.343144" }, { "step": 5446, "loss": 0.7379071116447449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.429519" }, { "step": 5447, "loss": 0.6598133444786072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.529036" }, { "step": 5448, "loss": 0.7174714803695679, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.614037" }, { "step": 5449, "loss": 0.9190279245376587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.706754" }, { "step": 5450, "loss": 0.7041617631912231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.792677" }, { "step": 5451, "loss": 0.7171375155448914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.877139" }, { "step": 5452, "loss": 0.5621190071105957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:33.999163" }, { "step": 5453, "loss": 0.6729136109352112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.090869" }, { "step": 5454, "loss": 0.3673545718193054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.189695" }, { "step": 5455, "loss": 0.586036741733551, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.286380" }, { "step": 5456, "loss": 0.7679854035377502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.427841" }, { "step": 5457, "loss": 0.33333590626716614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.520078" }, { "step": 5458, "loss": 0.5019077062606812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.614191" }, { "step": 5459, "loss": 0.5199846625328064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.701004" }, { "step": 5460, "loss": 0.5041605234146118, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.798834" }, { "step": 5461, "loss": 0.5721606016159058, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.883762" }, { "step": 5462, "loss": 0.544789731502533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:34.982168" }, { "step": 5463, "loss": 0.4494096636772156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.071576" }, { "step": 5464, "loss": 0.6150014996528625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.157727" }, { "step": 5465, "loss": 0.7446844577789307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.253474" }, { "step": 5466, "loss": 0.7300538420677185, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.342779" }, { "step": 5467, "loss": 0.8249831199645996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.458838" }, { "step": 5468, "loss": 0.8058160543441772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.567780" }, { "step": 5469, "loss": 0.8085838556289673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.653333" }, { "step": 5470, "loss": 0.7151392102241516, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.745996" }, { "step": 5471, "loss": 0.49036628007888794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.838556" }, { "step": 5472, "loss": 0.4160985052585602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:35.931872" }, { "step": 5473, "loss": 0.8659253120422363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.049039" }, { "step": 5474, "loss": 1.058165192604065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.135600" }, { "step": 5475, "loss": 0.5151556730270386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.224181" }, { "step": 5476, "loss": 0.4203997552394867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.309128" }, { "step": 5477, "loss": 0.5823208093643188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.408273" }, { "step": 5478, "loss": 0.3535323143005371, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.493185" }, { "step": 5479, "loss": 1.0452781915664673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.579306" }, { "step": 5480, "loss": 1.0725637674331665, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.695368" }, { "step": 5481, "loss": 0.48249685764312744, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.782975" }, { "step": 5482, "loss": 0.4864920973777771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.881525" }, { "step": 5483, "loss": 0.5452286005020142, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:36.972402" }, { "step": 5484, "loss": 0.37673404812812805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.058379" }, { "step": 5485, "loss": 0.585891604423523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.153154" }, { "step": 5486, "loss": 0.6570271849632263, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.249525" }, { "step": 5487, "loss": 0.5943127870559692, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.336937" }, { "step": 5488, "loss": 0.6160401105880737, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.426988" }, { "step": 5489, "loss": 0.6575560569763184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.521545" }, { "step": 5490, "loss": 0.5474190711975098, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.613703" }, { "step": 5491, "loss": 0.4395022988319397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.732126" }, { "step": 5492, "loss": 0.8002297282218933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.843074" }, { "step": 5493, "loss": 0.8359085321426392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:37.937007" }, { "step": 5494, "loss": 0.4762163758277893, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.032010" }, { "step": 5495, "loss": 0.5316457152366638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.124978" }, { "step": 5496, "loss": 1.0068575143814087, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.217536" }, { "step": 5497, "loss": 0.5335325598716736, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.337559" }, { "step": 5498, "loss": 0.38391926884651184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.427215" }, { "step": 5499, "loss": 0.8157317638397217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.512508" }, { "step": 5500, "loss": 0.5301922559738159, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:35:38.597996" }, { "step": 5501, "loss": 1.069484829902649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:01.678760" }, { "step": 5502, "loss": 0.6244121193885803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:01.772573" }, { "step": 5503, "loss": 0.5977312326431274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:01.857452" }, { "step": 5504, "loss": 0.6433150768280029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:01.950261" }, { "step": 5505, "loss": 0.5856589078903198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.042505" }, { "step": 5506, "loss": 0.4340008497238159, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.135634" }, { "step": 5507, "loss": 0.6331439018249512, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.228326" }, { "step": 5508, "loss": 0.5836597681045532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.320410" }, { "step": 5509, "loss": 0.9109430313110352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.411497" }, { "step": 5510, "loss": 0.5677180290222168, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.503712" }, { "step": 5511, "loss": 0.5407057404518127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.592292" }, { "step": 5512, "loss": 0.7564494013786316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.687636" }, { "step": 5513, "loss": 0.6306699514389038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.803416" }, { "step": 5514, "loss": 0.6047378182411194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.889861" }, { "step": 5515, "loss": 0.3515982925891876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:02.983580" }, { "step": 5516, "loss": 0.7020854949951172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.072442" }, { "step": 5517, "loss": 0.469836950302124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.162004" }, { "step": 5518, "loss": 0.5739010572433472, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.247316" }, { "step": 5519, "loss": 0.5913133025169373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.331859" }, { "step": 5520, "loss": 0.6165291666984558, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.426161" }, { "step": 5521, "loss": 0.6422848105430603, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.514863" }, { "step": 5522, "loss": 0.5667189359664917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.600405" }, { "step": 5523, "loss": 0.5706440210342407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.716859" }, { "step": 5524, "loss": 1.2217167615890503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.810872" }, { "step": 5525, "loss": 0.6342220902442932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:03.925350" }, { "step": 5526, "loss": 0.4954689145088196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.021450" }, { "step": 5527, "loss": 1.0643612146377563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.121413" }, { "step": 5528, "loss": 0.9879289865493774, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.206420" }, { "step": 5529, "loss": 0.7188736796379089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.297784" }, { "step": 5530, "loss": 0.5565375089645386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.381816" }, { "step": 5531, "loss": 0.8278661370277405, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.476851" }, { "step": 5532, "loss": 0.7808709144592285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.593674" }, { "step": 5533, "loss": 0.7380824685096741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.685885" }, { "step": 5534, "loss": 0.823722243309021, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.778132" }, { "step": 5535, "loss": 0.8058376312255859, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.890192" }, { "step": 5536, "loss": 0.7978777289390564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:04.984965" }, { "step": 5537, "loss": 0.45364677906036377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.076573" }, { "step": 5538, "loss": 0.7086925506591797, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.161799" }, { "step": 5539, "loss": 0.8476694822311401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.252438" }, { "step": 5540, "loss": 0.8700095415115356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.336916" }, { "step": 5541, "loss": 0.44587424397468567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.433222" }, { "step": 5542, "loss": 0.919380784034729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.525310" }, { "step": 5543, "loss": 0.9220453500747681, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.637413" }, { "step": 5544, "loss": 0.6280182600021362, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.751389" }, { "step": 5545, "loss": 0.6377507448196411, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.836598" }, { "step": 5546, "loss": 0.5384541153907776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:05.922809" }, { "step": 5547, "loss": 0.39631667733192444, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.007727" }, { "step": 5548, "loss": 0.627833366394043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.099303" }, { "step": 5549, "loss": 0.6499568819999695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.190881" }, { "step": 5550, "loss": 0.6667746305465698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.277561" }, { "step": 5551, "loss": 1.002081036567688, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.387562" }, { "step": 5552, "loss": 0.9571174383163452, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.498259" }, { "step": 5553, "loss": 0.44770193099975586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.588858" }, { "step": 5554, "loss": 0.832943856716156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.679347" }, { "step": 5555, "loss": 0.3153897225856781, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.771686" }, { "step": 5556, "loss": 0.530339241027832, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.857267" }, { "step": 5557, "loss": 0.803686797618866, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:06.943302" }, { "step": 5558, "loss": 0.5215588212013245, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.028982" }, { "step": 5559, "loss": 0.5630092024803162, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.140523" }, { "step": 5560, "loss": 0.7353876829147339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.225537" }, { "step": 5561, "loss": 0.5006199479103088, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.324125" }, { "step": 5562, "loss": 0.563177227973938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.441454" }, { "step": 5563, "loss": 0.5240774154663086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.533402" }, { "step": 5564, "loss": 0.6202017068862915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.626708" }, { "step": 5565, "loss": 0.8850138187408447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.720461" }, { "step": 5566, "loss": 0.5358899235725403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.837783" }, { "step": 5567, "loss": 0.28797948360443115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:07.929948" }, { "step": 5568, "loss": 0.7595804929733276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.019697" }, { "step": 5569, "loss": 0.7487918138504028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.137646" }, { "step": 5570, "loss": 0.7596962451934814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.227191" }, { "step": 5571, "loss": 0.6341238617897034, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.333424" }, { "step": 5572, "loss": 0.7128809094429016, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.419372" }, { "step": 5573, "loss": 0.292314350605011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.504891" }, { "step": 5574, "loss": 0.8500514030456543, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.589497" }, { "step": 5575, "loss": 0.2863239347934723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.674262" }, { "step": 5576, "loss": 0.5001517534255981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.759787" }, { "step": 5577, "loss": 0.7835900783538818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.845597" }, { "step": 5578, "loss": 0.7890653610229492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:08.956155" }, { "step": 5579, "loss": 0.5934634208679199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.044512" }, { "step": 5580, "loss": 0.7189675569534302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.163800" }, { "step": 5581, "loss": 0.7127552628517151, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.264033" }, { "step": 5582, "loss": 0.6467348337173462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.352754" }, { "step": 5583, "loss": 0.7936569452285767, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.437728" }, { "step": 5584, "loss": 0.6398410797119141, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.529021" }, { "step": 5585, "loss": 0.5076642036437988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.621736" }, { "step": 5586, "loss": 0.6170570254325867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.706080" }, { "step": 5587, "loss": 0.23510873317718506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.802313" }, { "step": 5588, "loss": 0.4230172336101532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.887643" }, { "step": 5589, "loss": 0.6580657958984375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:09.979873" }, { "step": 5590, "loss": 0.6074891686439514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.095724" }, { "step": 5591, "loss": 0.5522722005844116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.182138" }, { "step": 5592, "loss": 0.5334587097167969, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.266118" }, { "step": 5593, "loss": 0.6482205390930176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.360553" }, { "step": 5594, "loss": 0.8095447421073914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.444709" }, { "step": 5595, "loss": 0.5615391731262207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.556449" }, { "step": 5596, "loss": 0.7091141939163208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.667436" }, { "step": 5597, "loss": 0.42119020223617554, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.758424" }, { "step": 5598, "loss": 0.5275241732597351, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.858695" }, { "step": 5599, "loss": 0.7543397545814514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:10.943283" }, { "step": 5600, "loss": 0.24604639410972595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.042039" }, { "step": 5601, "loss": 0.5229141712188721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.129379" }, { "step": 5602, "loss": 1.0131573677062988, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.214641" }, { "step": 5603, "loss": 0.27084001898765564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.303247" }, { "step": 5604, "loss": 0.5638006925582886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.393099" }, { "step": 5605, "loss": 0.2824951112270355, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.480419" }, { "step": 5606, "loss": 0.28887736797332764, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.577339" }, { "step": 5607, "loss": 0.7528221607208252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.687912" }, { "step": 5608, "loss": 0.7317725419998169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.778535" }, { "step": 5609, "loss": 0.6285457611083984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.867330" }, { "step": 5610, "loss": 0.6453640460968018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:11.965032" }, { "step": 5611, "loss": 0.90389084815979, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.051709" }, { "step": 5612, "loss": 0.739693820476532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.137943" }, { "step": 5613, "loss": 1.0084686279296875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.224967" }, { "step": 5614, "loss": 1.0901228189468384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.330717" }, { "step": 5615, "loss": 0.7230225801467896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.423863" }, { "step": 5616, "loss": 0.8009212017059326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.517122" }, { "step": 5617, "loss": 0.39854246377944946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.611147" }, { "step": 5618, "loss": 0.7934306859970093, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.706099" }, { "step": 5619, "loss": 0.9525821805000305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.802724" }, { "step": 5620, "loss": 0.8670251369476318, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:12.912608" }, { "step": 5621, "loss": 0.7981773614883423, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.000007" }, { "step": 5622, "loss": 0.9436773657798767, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.093329" }, { "step": 5623, "loss": 0.9227885007858276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.230894" }, { "step": 5624, "loss": 0.39947080612182617, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.321454" }, { "step": 5625, "loss": 0.49277451634407043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.405565" }, { "step": 5626, "loss": 0.6213210821151733, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.493545" }, { "step": 5627, "loss": 0.44442471861839294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.594192" }, { "step": 5628, "loss": 0.7226306200027466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.689064" }, { "step": 5629, "loss": 0.5975019335746765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.774249" }, { "step": 5630, "loss": 0.6392695307731628, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.867798" }, { "step": 5631, "loss": 0.8172416687011719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:13.978960" }, { "step": 5632, "loss": 0.6009588241577148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.066142" }, { "step": 5633, "loss": 0.3634352385997772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.158770" }, { "step": 5634, "loss": 0.8165111541748047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.291462" }, { "step": 5635, "loss": 0.3914180397987366, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.381470" }, { "step": 5636, "loss": 0.5138115286827087, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.474285" }, { "step": 5637, "loss": 0.7316917181015015, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.559255" }, { "step": 5638, "loss": 0.9305991530418396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.665756" }, { "step": 5639, "loss": 0.817363977432251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.762958" }, { "step": 5640, "loss": 0.635474681854248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.854630" }, { "step": 5641, "loss": 0.8039060831069946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:14.948222" }, { "step": 5642, "loss": 0.5635071396827698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.043886" }, { "step": 5643, "loss": 0.37758398056030273, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.130184" }, { "step": 5644, "loss": 0.8428970575332642, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.218927" }, { "step": 5645, "loss": 0.6884297132492065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.312394" }, { "step": 5646, "loss": 0.7362551689147949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.400490" }, { "step": 5647, "loss": 0.8996497392654419, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.485067" }, { "step": 5648, "loss": 0.5149154663085938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.601793" }, { "step": 5649, "loss": 0.6167410612106323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.696160" }, { "step": 5650, "loss": 0.6931764483451843, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.812416" }, { "step": 5651, "loss": 0.3935929536819458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.905106" }, { "step": 5652, "loss": 0.7141790390014648, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:15.990572" }, { "step": 5653, "loss": 0.6203509569168091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.085913" }, { "step": 5654, "loss": 0.6458877921104431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.178897" }, { "step": 5655, "loss": 0.3789830505847931, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.271605" }, { "step": 5656, "loss": 0.660812258720398, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.382731" }, { "step": 5657, "loss": 0.768876314163208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.495791" }, { "step": 5658, "loss": 0.626073956489563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.581501" }, { "step": 5659, "loss": 0.8127492666244507, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.696382" }, { "step": 5660, "loss": 0.2597505450248718, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.781566" }, { "step": 5661, "loss": 0.5234634280204773, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.893942" }, { "step": 5662, "loss": 0.6957606673240662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:16.979110" }, { "step": 5663, "loss": 0.6869414448738098, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.071741" }, { "step": 5664, "loss": 0.5302432775497437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.156473" }, { "step": 5665, "loss": 0.6929314136505127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.270386" }, { "step": 5666, "loss": 0.4730122983455658, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.357970" }, { "step": 5667, "loss": 0.5067132711410522, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.444391" }, { "step": 5668, "loss": 1.1211423873901367, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.529503" }, { "step": 5669, "loss": 0.6299549341201782, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.647837" }, { "step": 5670, "loss": 0.7017507553100586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.741361" }, { "step": 5671, "loss": 0.7918597459793091, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.836228" }, { "step": 5672, "loss": 0.4024396538734436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:17.953459" }, { "step": 5673, "loss": 0.721580445766449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.049061" }, { "step": 5674, "loss": 0.41677939891815186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.141510" }, { "step": 5675, "loss": 0.43923014402389526, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.253892" }, { "step": 5676, "loss": 0.5398375988006592, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.339289" }, { "step": 5677, "loss": 0.5534284114837646, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.426282" }, { "step": 5678, "loss": 0.5321100950241089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.516905" }, { "step": 5679, "loss": 0.5441781878471375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.633891" }, { "step": 5680, "loss": 0.31380826234817505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.732475" }, { "step": 5681, "loss": 0.66438227891922, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.852767" }, { "step": 5682, "loss": 0.531139612197876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:18.938378" }, { "step": 5683, "loss": 0.679900050163269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.048621" }, { "step": 5684, "loss": 0.5136862993240356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.136323" }, { "step": 5685, "loss": 0.5323426723480225, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.221031" }, { "step": 5686, "loss": 0.8125777840614319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.308961" }, { "step": 5687, "loss": 0.8911144733428955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.428381" }, { "step": 5688, "loss": 0.7599362134933472, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.512612" }, { "step": 5689, "loss": 0.6044619679450989, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.608571" }, { "step": 5690, "loss": 0.7708256840705872, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.710724" }, { "step": 5691, "loss": 0.8096296787261963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.827065" }, { "step": 5692, "loss": 0.9449350833892822, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:19.933817" }, { "step": 5693, "loss": 1.148485779762268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.025442" }, { "step": 5694, "loss": 0.53568434715271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.124729" }, { "step": 5695, "loss": 0.7837378978729248, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.220754" }, { "step": 5696, "loss": 1.3290468454360962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.307183" }, { "step": 5697, "loss": 0.7056277990341187, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.399439" }, { "step": 5698, "loss": 0.7229843139648438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.487151" }, { "step": 5699, "loss": 0.6728113889694214, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.576073" }, { "step": 5700, "loss": 0.7151197195053101, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.661067" }, { "step": 5701, "loss": 0.6461265087127686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.747731" }, { "step": 5702, "loss": 0.6203290820121765, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.835440" }, { "step": 5703, "loss": 0.7503830194473267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:20.925786" }, { "step": 5704, "loss": 0.3669392764568329, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.015809" }, { "step": 5705, "loss": 0.8296014070510864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.127589" }, { "step": 5706, "loss": 0.6905599236488342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.240695" }, { "step": 5707, "loss": 0.7569985389709473, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.377647" }, { "step": 5708, "loss": 0.6519213318824768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.468726" }, { "step": 5709, "loss": 0.7407724857330322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.553131" }, { "step": 5710, "loss": 0.7708756923675537, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.648973" }, { "step": 5711, "loss": 0.5742967128753662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.742842" }, { "step": 5712, "loss": 0.3772798776626587, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.835361" }, { "step": 5713, "loss": 0.48609817028045654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:21.936741" }, { "step": 5714, "loss": 0.8870813250541687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.024810" }, { "step": 5715, "loss": 0.4052647054195404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.110720" }, { "step": 5716, "loss": 0.4161339998245239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.204398" }, { "step": 5717, "loss": 0.6613152027130127, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.296549" }, { "step": 5718, "loss": 0.5337086915969849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.409652" }, { "step": 5719, "loss": 0.4820641875267029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.506605" }, { "step": 5720, "loss": 0.34211283922195435, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.596779" }, { "step": 5721, "loss": 0.6397532820701599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.692362" }, { "step": 5722, "loss": 0.720239520072937, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.778214" }, { "step": 5723, "loss": 0.5129733085632324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.904816" }, { "step": 5724, "loss": 0.7127435207366943, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:22.995651" }, { "step": 5725, "loss": 0.7054228782653809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.082300" }, { "step": 5726, "loss": 0.513144850730896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.168396" }, { "step": 5727, "loss": 0.56893390417099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.254139" }, { "step": 5728, "loss": 0.5451650619506836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.346884" }, { "step": 5729, "loss": 0.8534842729568481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.454397" }, { "step": 5730, "loss": 0.7874561548233032, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.540477" }, { "step": 5731, "loss": 0.6573663949966431, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.639183" }, { "step": 5732, "loss": 0.6281607747077942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.739436" }, { "step": 5733, "loss": 0.6630299091339111, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.833553" }, { "step": 5734, "loss": 0.6079042553901672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:23.927653" }, { "step": 5735, "loss": 0.5658852458000183, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.013751" }, { "step": 5736, "loss": 0.4198507070541382, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.137051" }, { "step": 5737, "loss": 0.5705596208572388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.222856" }, { "step": 5738, "loss": 0.561165988445282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.311348" }, { "step": 5739, "loss": 0.39299657940864563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.403573" }, { "step": 5740, "loss": 0.5350469946861267, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.489321" }, { "step": 5741, "loss": 0.48758089542388916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.581942" }, { "step": 5742, "loss": 0.35415488481521606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.667509" }, { "step": 5743, "loss": 0.6598008871078491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.754430" }, { "step": 5744, "loss": 0.440854549407959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.839247" }, { "step": 5745, "loss": 0.4634512662887573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:24.926142" }, { "step": 5746, "loss": 0.5493180155754089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.012043" }, { "step": 5747, "loss": 0.8293261528015137, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.105177" }, { "step": 5748, "loss": 0.6530951857566833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.195255" }, { "step": 5749, "loss": 0.8672972917556763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.279557" }, { "step": 5750, "loss": 0.4747008681297302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.371375" }, { "step": 5751, "loss": 0.3172646164894104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.462216" }, { "step": 5752, "loss": 0.750555157661438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.551207" }, { "step": 5753, "loss": 0.49906665086746216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.645965" }, { "step": 5754, "loss": 0.41441139578819275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.737921" }, { "step": 5755, "loss": 0.6423462629318237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.822842" }, { "step": 5756, "loss": 0.8580732345581055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:25.912626" }, { "step": 5757, "loss": 0.9686923623085022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.053014" }, { "step": 5758, "loss": 0.51237952709198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.139070" }, { "step": 5759, "loss": 0.8733443021774292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.250837" }, { "step": 5760, "loss": 0.44142621755599976, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.342761" }, { "step": 5761, "loss": 0.652829110622406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.429699" }, { "step": 5762, "loss": 0.5451958179473877, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.519924" }, { "step": 5763, "loss": 0.5840594172477722, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.605765" }, { "step": 5764, "loss": 0.532623827457428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.699979" }, { "step": 5765, "loss": 0.7662405967712402, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.793656" }, { "step": 5766, "loss": 0.46170634031295776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.878913" }, { "step": 5767, "loss": 0.6902436017990112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:26.987935" }, { "step": 5768, "loss": 0.8028832077980042, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.074488" }, { "step": 5769, "loss": 0.48889946937561035, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.173408" }, { "step": 5770, "loss": 0.6389898061752319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.264562" }, { "step": 5771, "loss": 1.160046935081482, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.386735" }, { "step": 5772, "loss": 0.45359474420547485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.471758" }, { "step": 5773, "loss": 0.649972677230835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.565505" }, { "step": 5774, "loss": 0.6480761170387268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.674741" }, { "step": 5775, "loss": 0.4968363642692566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.760911" }, { "step": 5776, "loss": 0.5223017930984497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.879279" }, { "step": 5777, "loss": 0.7830712199211121, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:27.965916" }, { "step": 5778, "loss": 0.8790167570114136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.108331" }, { "step": 5779, "loss": 0.5744434595108032, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.199199" }, { "step": 5780, "loss": 0.9198564291000366, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.294714" }, { "step": 5781, "loss": 0.5261290669441223, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.389843" }, { "step": 5782, "loss": 0.5671740174293518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.479863" }, { "step": 5783, "loss": 0.5203784704208374, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.606738" }, { "step": 5784, "loss": 0.7219885587692261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.716355" }, { "step": 5785, "loss": 1.305742859840393, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.798303" }, { "step": 5786, "loss": 0.5374019145965576, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.883562" }, { "step": 5787, "loss": 0.7947397232055664, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:28.978289" }, { "step": 5788, "loss": 0.8574886322021484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.063704" }, { "step": 5789, "loss": 0.6941810250282288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.152617" }, { "step": 5790, "loss": 0.34460991621017456, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.238403" }, { "step": 5791, "loss": 0.5838771462440491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.331433" }, { "step": 5792, "loss": 0.6624184250831604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.430409" }, { "step": 5793, "loss": 0.6822004914283752, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.546675" }, { "step": 5794, "loss": 0.37355536222457886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.646997" }, { "step": 5795, "loss": 0.8220003843307495, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.761363" }, { "step": 5796, "loss": 0.7633988261222839, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.873338" }, { "step": 5797, "loss": 0.5532153248786926, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:29.966453" }, { "step": 5798, "loss": 1.0513670444488525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.078526" }, { "step": 5799, "loss": 0.8101824522018433, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.169181" }, { "step": 5800, "loss": 0.5199915170669556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.255971" }, { "step": 5801, "loss": 0.7918421626091003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.369138" }, { "step": 5802, "loss": 0.7365670204162598, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.456262" }, { "step": 5803, "loss": 0.8026846647262573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.555967" }, { "step": 5804, "loss": 1.1632275581359863, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.647197" }, { "step": 5805, "loss": 0.780371904373169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.733510" }, { "step": 5806, "loss": 0.8066176176071167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.849056" }, { "step": 5807, "loss": 1.0424830913543701, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:30.941031" }, { "step": 5808, "loss": 0.3051396310329437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.031804" }, { "step": 5809, "loss": 0.5652732849121094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.161169" }, { "step": 5810, "loss": 0.3412977457046509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.246987" }, { "step": 5811, "loss": 0.68146151304245, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.354868" }, { "step": 5812, "loss": 0.5950397849082947, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.477359" }, { "step": 5813, "loss": 0.9685578942298889, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.605380" }, { "step": 5814, "loss": 1.1698839664459229, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.722575" }, { "step": 5815, "loss": 0.6958124041557312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.808426" }, { "step": 5816, "loss": 0.8408294916152954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:31.919790" }, { "step": 5817, "loss": 0.7168868780136108, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.033664" }, { "step": 5818, "loss": 0.9514514207839966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.128937" }, { "step": 5819, "loss": 0.6021528840065002, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.217973" }, { "step": 5820, "loss": 0.4247845411300659, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.314048" }, { "step": 5821, "loss": 0.39203837513923645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.409010" }, { "step": 5822, "loss": 0.5314009785652161, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.501606" }, { "step": 5823, "loss": 0.43554913997650146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.589566" }, { "step": 5824, "loss": 0.7212445735931396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.703707" }, { "step": 5825, "loss": 0.6576374173164368, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.789851" }, { "step": 5826, "loss": 0.5771899223327637, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.887974" }, { "step": 5827, "loss": 0.8082834482192993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:32.985951" }, { "step": 5828, "loss": 1.0622189044952393, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.078701" }, { "step": 5829, "loss": 0.5625197887420654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.167077" }, { "step": 5830, "loss": 0.34767255187034607, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.259455" }, { "step": 5831, "loss": 0.5251566767692566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.351999" }, { "step": 5832, "loss": 0.8270056247711182, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.450401" }, { "step": 5833, "loss": 0.6659413576126099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.551635" }, { "step": 5834, "loss": 0.5450518131256104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.670027" }, { "step": 5835, "loss": 0.5933257341384888, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.761190" }, { "step": 5836, "loss": 0.7416675090789795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.850749" }, { "step": 5837, "loss": 0.7284349203109741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:33.946769" }, { "step": 5838, "loss": 0.7588080763816833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.040095" }, { "step": 5839, "loss": 0.7072938084602356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.138015" }, { "step": 5840, "loss": 0.5629714131355286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.248409" }, { "step": 5841, "loss": 0.2248498797416687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.341329" }, { "step": 5842, "loss": 0.5705032348632812, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.433417" }, { "step": 5843, "loss": 0.36318275332450867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.518827" }, { "step": 5844, "loss": 0.8575214743614197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.605502" }, { "step": 5845, "loss": 0.6391345262527466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.693914" }, { "step": 5846, "loss": 0.69350266456604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.778892" }, { "step": 5847, "loss": 0.7588538527488708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.866877" }, { "step": 5848, "loss": 0.7628508806228638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:34.981462" }, { "step": 5849, "loss": 0.9422537088394165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.098341" }, { "step": 5850, "loss": 0.5388545393943787, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.190230" }, { "step": 5851, "loss": 0.5409677624702454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.276179" }, { "step": 5852, "loss": 1.1208152770996094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.361770" }, { "step": 5853, "loss": 0.32522836327552795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.449043" }, { "step": 5854, "loss": 0.5548256039619446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.557279" }, { "step": 5855, "loss": 0.9676598906517029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.664392" }, { "step": 5856, "loss": 0.5211814641952515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.757169" }, { "step": 5857, "loss": 0.9397932887077332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.874248" }, { "step": 5858, "loss": 0.32712531089782715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:35.960423" }, { "step": 5859, "loss": 0.5464498996734619, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.048988" }, { "step": 5860, "loss": 0.6092755198478699, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.135359" }, { "step": 5861, "loss": 0.4704321026802063, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.232122" }, { "step": 5862, "loss": 0.7386331558227539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.346405" }, { "step": 5863, "loss": 0.6750144958496094, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.440877" }, { "step": 5864, "loss": 0.7462677359580994, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.560007" }, { "step": 5865, "loss": 0.6382085084915161, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.650946" }, { "step": 5866, "loss": 0.7166619896888733, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.738462" }, { "step": 5867, "loss": 0.7537093162536621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.850185" }, { "step": 5868, "loss": 0.5959802865982056, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:36.937257" }, { "step": 5869, "loss": 0.6570081114768982, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.021586" }, { "step": 5870, "loss": 0.7353675961494446, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.112722" }, { "step": 5871, "loss": 0.8188416361808777, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.197762" }, { "step": 5872, "loss": 0.4337729811668396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.294422" }, { "step": 5873, "loss": 0.6895669102668762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.379844" }, { "step": 5874, "loss": 0.8857020735740662, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.465585" }, { "step": 5875, "loss": 0.37234750390052795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.552191" }, { "step": 5876, "loss": 0.6168774366378784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.667195" }, { "step": 5877, "loss": 0.7453489303588867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.758915" }, { "step": 5878, "loss": 0.6031239628791809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.850940" }, { "step": 5879, "loss": 0.4633709788322449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:37.944149" }, { "step": 5880, "loss": 0.4003934860229492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.036037" }, { "step": 5881, "loss": 0.5753026008605957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.120902" }, { "step": 5882, "loss": 0.4765916168689728, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.205639" }, { "step": 5883, "loss": 0.46081897616386414, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.298542" }, { "step": 5884, "loss": 0.7254297733306885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.384721" }, { "step": 5885, "loss": 0.6112894415855408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.502143" }, { "step": 5886, "loss": 0.6036748290061951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.592201" }, { "step": 5887, "loss": 0.5821104645729065, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.688271" }, { "step": 5888, "loss": 0.6874103546142578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.773689" }, { "step": 5889, "loss": 0.6802351474761963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.865769" }, { "step": 5890, "loss": 0.6211977601051331, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:38.958793" }, { "step": 5891, "loss": 0.4410836100578308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.051683" }, { "step": 5892, "loss": 0.4951089024543762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.150396" }, { "step": 5893, "loss": 0.8480334281921387, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.246720" }, { "step": 5894, "loss": 0.5130068063735962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.339126" }, { "step": 5895, "loss": 0.5607362985610962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.455360" }, { "step": 5896, "loss": 0.8908753395080566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.559353" }, { "step": 5897, "loss": 0.5460812449455261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.649843" }, { "step": 5898, "loss": 0.8652976751327515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.734865" }, { "step": 5899, "loss": 0.8472335338592529, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.821354" }, { "step": 5900, "loss": 0.44766220450401306, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:39.915295" }, { "step": 5901, "loss": 0.5553398132324219, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.012952" }, { "step": 5902, "loss": 0.6585631370544434, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.101474" }, { "step": 5903, "loss": 0.683377742767334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.195452" }, { "step": 5904, "loss": 0.38390272855758667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.279494" }, { "step": 5905, "loss": 1.0160627365112305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.389901" }, { "step": 5906, "loss": 0.446743369102478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.483109" }, { "step": 5907, "loss": 0.5254479050636292, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.572867" }, { "step": 5908, "loss": 0.634061336517334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.681564" }, { "step": 5909, "loss": 0.7702344655990601, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.794728" }, { "step": 5910, "loss": 0.783619225025177, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.903653" }, { "step": 5911, "loss": 0.5501792430877686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:40.998566" }, { "step": 5912, "loss": 0.5581060647964478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.096768" }, { "step": 5913, "loss": 0.6582910418510437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.181107" }, { "step": 5914, "loss": 0.37706252932548523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.266880" }, { "step": 5915, "loss": 0.41323214769363403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.362455" }, { "step": 5916, "loss": 0.750825047492981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.474420" }, { "step": 5917, "loss": 0.4847870171070099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.565694" }, { "step": 5918, "loss": 0.49137604236602783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.659289" }, { "step": 5919, "loss": 0.8015053272247314, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.743667" }, { "step": 5920, "loss": 0.9358921051025391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.854001" }, { "step": 5921, "loss": 0.8345065116882324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:41.961005" }, { "step": 5922, "loss": 0.42859265208244324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.049077" }, { "step": 5923, "loss": 1.224048137664795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.137240" }, { "step": 5924, "loss": 0.7930411100387573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.251818" }, { "step": 5925, "loss": 0.4475371837615967, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.355370" }, { "step": 5926, "loss": 0.6195845603942871, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.441571" }, { "step": 5927, "loss": 0.7014752626419067, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.526439" }, { "step": 5928, "loss": 0.5047822594642639, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.618224" }, { "step": 5929, "loss": 1.1633228063583374, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.710466" }, { "step": 5930, "loss": 0.40616297721862793, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.809907" }, { "step": 5931, "loss": 0.44736796617507935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.898272" }, { "step": 5932, "loss": 0.6938947439193726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:42.986284" }, { "step": 5933, "loss": 0.5915320515632629, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.071350" }, { "step": 5934, "loss": 0.6396077871322632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.182190" }, { "step": 5935, "loss": 0.5278573036193848, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.266732" }, { "step": 5936, "loss": 0.7449432611465454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.358108" }, { "step": 5937, "loss": 0.4357483983039856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.451559" }, { "step": 5938, "loss": 0.29153719544410706, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.566631" }, { "step": 5939, "loss": 0.7246004939079285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.650954" }, { "step": 5940, "loss": 0.6290202140808105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.772303" }, { "step": 5941, "loss": 1.2892699241638184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.857918" }, { "step": 5942, "loss": 0.37840723991394043, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:43.949754" }, { "step": 5943, "loss": 0.579164445400238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.065858" }, { "step": 5944, "loss": 0.7609965801239014, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.153518" }, { "step": 5945, "loss": 0.687138557434082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.263925" }, { "step": 5946, "loss": 0.294299453496933, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.362133" }, { "step": 5947, "loss": 0.8553895950317383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.476752" }, { "step": 5948, "loss": 0.5105088949203491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.565523" }, { "step": 5949, "loss": 0.5741817951202393, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.662123" }, { "step": 5950, "loss": 0.4122381806373596, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.748213" }, { "step": 5951, "loss": 0.614087700843811, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.840580" }, { "step": 5952, "loss": 0.7532903552055359, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:44.929697" }, { "step": 5953, "loss": 0.3205457627773285, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.026923" }, { "step": 5954, "loss": 0.7831594944000244, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.114536" }, { "step": 5955, "loss": 0.6618998050689697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.201117" }, { "step": 5956, "loss": 0.3618429899215698, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.294609" }, { "step": 5957, "loss": 0.6709098815917969, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.387946" }, { "step": 5958, "loss": 1.2290711402893066, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.473680" }, { "step": 5959, "loss": 0.8762639760971069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.583001" }, { "step": 5960, "loss": 0.6828989386558533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.679869" }, { "step": 5961, "loss": 0.5198712944984436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.778283" }, { "step": 5962, "loss": 0.7255573272705078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.864468" }, { "step": 5963, "loss": 0.7480034828186035, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:45.958926" }, { "step": 5964, "loss": 0.6150442957878113, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.052006" }, { "step": 5965, "loss": 0.5047993063926697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.143010" }, { "step": 5966, "loss": 0.3626756966114044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.235785" }, { "step": 5967, "loss": 0.6977856159210205, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.380266" }, { "step": 5968, "loss": 0.44238653779029846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.465399" }, { "step": 5969, "loss": 0.7313656806945801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.561291" }, { "step": 5970, "loss": 0.7278785705566406, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.673292" }, { "step": 5971, "loss": 1.2209076881408691, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.760444" }, { "step": 5972, "loss": 0.8943623900413513, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.847035" }, { "step": 5973, "loss": 0.9165500998497009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:46.960932" }, { "step": 5974, "loss": 0.5101460814476013, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.053906" }, { "step": 5975, "loss": 0.7611429691314697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.174059" }, { "step": 5976, "loss": 0.6266164183616638, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.261920" }, { "step": 5977, "loss": 0.6860606074333191, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.352207" }, { "step": 5978, "loss": 0.6604616641998291, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.439958" }, { "step": 5979, "loss": 0.48386234045028687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.526985" }, { "step": 5980, "loss": 0.6971194744110107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.619467" }, { "step": 5981, "loss": 0.3162774443626404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.712816" }, { "step": 5982, "loss": 0.5253907442092896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.800209" }, { "step": 5983, "loss": 0.6419278979301453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:47.917288" }, { "step": 5984, "loss": 0.4822232127189636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.002289" }, { "step": 5985, "loss": 0.5951788425445557, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.098734" }, { "step": 5986, "loss": 0.8916918039321899, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.187079" }, { "step": 5987, "loss": 0.7542407512664795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.278754" }, { "step": 5988, "loss": 0.4329749047756195, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.364422" }, { "step": 5989, "loss": 0.8309028744697571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.482008" }, { "step": 5990, "loss": 0.6378041505813599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.581549" }, { "step": 5991, "loss": 0.4396420121192932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.667486" }, { "step": 5992, "loss": 0.5084913372993469, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.775928" }, { "step": 5993, "loss": 0.9170872569084167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.885454" }, { "step": 5994, "loss": 0.6892221570014954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:48.978098" }, { "step": 5995, "loss": 0.9382236003875732, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:49.088509" }, { "step": 5996, "loss": 0.38317012786865234, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:49.177245" }, { "step": 5997, "loss": 0.618238627910614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:49.270798" }, { "step": 5998, "loss": 0.4868793189525604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:49.384762" }, { "step": 5999, "loss": 0.3476071059703827, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:49.472224" }, { "step": 6000, "loss": 0.6577726006507874, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:36:49.563438" }, { "step": 6001, "loss": 0.6220020055770874, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:12.820274" }, { "step": 6002, "loss": 0.6280674934387207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:12.914938" }, { "step": 6003, "loss": 0.5537983179092407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.003529" }, { "step": 6004, "loss": 0.7024269104003906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.098272" }, { "step": 6005, "loss": 0.6608760952949524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.216833" }, { "step": 6006, "loss": 0.6798566579818726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.306379" }, { "step": 6007, "loss": 0.7898858189582825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.393629" }, { "step": 6008, "loss": 0.7394996881484985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.490803" }, { "step": 6009, "loss": 0.4293012022972107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.577926" }, { "step": 6010, "loss": 0.7847177386283875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.692597" }, { "step": 6011, "loss": 0.9033337831497192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.799188" }, { "step": 6012, "loss": 1.0285292863845825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.893104" }, { "step": 6013, "loss": 0.8120578527450562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:13.980527" }, { "step": 6014, "loss": 0.6473052501678467, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.079261" }, { "step": 6015, "loss": 0.5964269638061523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.168053" }, { "step": 6016, "loss": 0.2951844334602356, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.261499" }, { "step": 6017, "loss": 0.36074885725975037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.358152" }, { "step": 6018, "loss": 0.663282036781311, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.471447" }, { "step": 6019, "loss": 0.518700361251831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.574867" }, { "step": 6020, "loss": 1.0827720165252686, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.666502" }, { "step": 6021, "loss": 0.6328470706939697, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.789299" }, { "step": 6022, "loss": 0.8920124769210815, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.882110" }, { "step": 6023, "loss": 0.7179198265075684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:14.974441" }, { "step": 6024, "loss": 0.8592641353607178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.087339" }, { "step": 6025, "loss": 0.9697800874710083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.201300" }, { "step": 6026, "loss": 0.552260160446167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.296385" }, { "step": 6027, "loss": 0.5309256315231323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.381391" }, { "step": 6028, "loss": 0.4961375892162323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.468640" }, { "step": 6029, "loss": 0.7041685581207275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.584735" }, { "step": 6030, "loss": 0.5238998532295227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.677776" }, { "step": 6031, "loss": 0.4406386613845825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.771798" }, { "step": 6032, "loss": 0.7084073424339294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.860346" }, { "step": 6033, "loss": 0.6187645792961121, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:15.949356" }, { "step": 6034, "loss": 0.4999510645866394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.036543" }, { "step": 6035, "loss": 0.5617572665214539, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.128570" }, { "step": 6036, "loss": 0.7096449136734009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.223017" }, { "step": 6037, "loss": 0.5596957206726074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.314275" }, { "step": 6038, "loss": 0.960456371307373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.433567" }, { "step": 6039, "loss": 0.4244721531867981, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.552174" }, { "step": 6040, "loss": 0.7902840375900269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.646914" }, { "step": 6041, "loss": 0.8126105070114136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.740738" }, { "step": 6042, "loss": 0.8727852702140808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.858880" }, { "step": 6043, "loss": 0.5193896889686584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:16.960068" }, { "step": 6044, "loss": 0.508758544921875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.054720" }, { "step": 6045, "loss": 0.44461750984191895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.140859" }, { "step": 6046, "loss": 0.6480474472045898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.226245" }, { "step": 6047, "loss": 0.8986494541168213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.320987" }, { "step": 6048, "loss": 0.5652695894241333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.413255" }, { "step": 6049, "loss": 0.7855355739593506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.513877" }, { "step": 6050, "loss": 1.0974236726760864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.628927" }, { "step": 6051, "loss": 0.689873456954956, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.724978" }, { "step": 6052, "loss": 0.7081879377365112, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.820987" }, { "step": 6053, "loss": 0.6971246004104614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:17.935382" }, { "step": 6054, "loss": 0.5776461362838745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.020467" }, { "step": 6055, "loss": 0.3687437176704407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.108340" }, { "step": 6056, "loss": 0.5488094687461853, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.229544" }, { "step": 6057, "loss": 0.5630266070365906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.315448" }, { "step": 6058, "loss": 0.5596774816513062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.410250" }, { "step": 6059, "loss": 0.7749810814857483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.533208" }, { "step": 6060, "loss": 0.33865585923194885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.631437" }, { "step": 6061, "loss": 0.972136378288269, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.745223" }, { "step": 6062, "loss": 0.5299461483955383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.833989" }, { "step": 6063, "loss": 0.5798065662384033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:18.936073" }, { "step": 6064, "loss": 0.7596538066864014, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.068627" }, { "step": 6065, "loss": 0.39173340797424316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.155187" }, { "step": 6066, "loss": 0.44091466069221497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.240912" }, { "step": 6067, "loss": 0.6339828968048096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.353224" }, { "step": 6068, "loss": 1.1501743793487549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.449184" }, { "step": 6069, "loss": 0.5024289488792419, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.538484" }, { "step": 6070, "loss": 0.474955677986145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.629123" }, { "step": 6071, "loss": 0.6414593458175659, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.750216" }, { "step": 6072, "loss": 0.4494363069534302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.843057" }, { "step": 6073, "loss": 0.294528990983963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:19.935820" }, { "step": 6074, "loss": 0.5248681306838989, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.027165" }, { "step": 6075, "loss": 0.6838059425354004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.113676" }, { "step": 6076, "loss": 0.8741159439086914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.198351" }, { "step": 6077, "loss": 0.5322624444961548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.289169" }, { "step": 6078, "loss": 0.754462480545044, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.375652" }, { "step": 6079, "loss": 0.6615715622901917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.468203" }, { "step": 6080, "loss": 0.9003994464874268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.582093" }, { "step": 6081, "loss": 0.5272848010063171, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.682614" }, { "step": 6082, "loss": 0.5458800792694092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.767596" }, { "step": 6083, "loss": 0.41118189692497253, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.863789" }, { "step": 6084, "loss": 0.4492420554161072, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:20.963077" }, { "step": 6085, "loss": 0.5060544013977051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.056742" }, { "step": 6086, "loss": 0.663295328617096, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.154703" }, { "step": 6087, "loss": 0.779157280921936, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.246179" }, { "step": 6088, "loss": 0.9119932651519775, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.359387" }, { "step": 6089, "loss": 0.42066264152526855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.461367" }, { "step": 6090, "loss": 0.6574292182922363, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.561134" }, { "step": 6091, "loss": 0.6491479277610779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.677357" }, { "step": 6092, "loss": 0.3916025757789612, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.770795" }, { "step": 6093, "loss": 0.5996114015579224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:21.864270" }, { "step": 6094, "loss": 0.6048060059547424, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.012839" }, { "step": 6095, "loss": 0.323758989572525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.104946" }, { "step": 6096, "loss": 0.45359694957733154, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.195031" }, { "step": 6097, "loss": 0.44892215728759766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.291138" }, { "step": 6098, "loss": 0.6968862414360046, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.400379" }, { "step": 6099, "loss": 0.46126583218574524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.490598" }, { "step": 6100, "loss": 0.8830605745315552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.576082" }, { "step": 6101, "loss": 0.41606491804122925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.673935" }, { "step": 6102, "loss": 0.7578031420707703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.760363" }, { "step": 6103, "loss": 0.5335155129432678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.875360" }, { "step": 6104, "loss": 0.504923939704895, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:22.960916" }, { "step": 6105, "loss": 0.5979379415512085, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.047829" }, { "step": 6106, "loss": 0.4021149277687073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.141564" }, { "step": 6107, "loss": 0.3469591736793518, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.233372" }, { "step": 6108, "loss": 0.7807942628860474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.319387" }, { "step": 6109, "loss": 0.9269797801971436, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.404705" }, { "step": 6110, "loss": 0.42885148525238037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.499085" }, { "step": 6111, "loss": 0.48931896686553955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.591672" }, { "step": 6112, "loss": 0.6265695095062256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.687729" }, { "step": 6113, "loss": 0.5818986892700195, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.777304" }, { "step": 6114, "loss": 0.9088456034660339, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.863425" }, { "step": 6115, "loss": 0.6900248527526855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:23.964800" }, { "step": 6116, "loss": 0.3964826762676239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.067199" }, { "step": 6117, "loss": 0.7345868349075317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.205027" }, { "step": 6118, "loss": 0.41395455598831177, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.296069" }, { "step": 6119, "loss": 1.1220526695251465, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.393169" }, { "step": 6120, "loss": 0.8563897609710693, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.491560" }, { "step": 6121, "loss": 1.0200711488723755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.577347" }, { "step": 6122, "loss": 0.5283295512199402, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.674769" }, { "step": 6123, "loss": 0.917076826095581, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.760761" }, { "step": 6124, "loss": 0.696611762046814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.849211" }, { "step": 6125, "loss": 0.6842105984687805, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:24.940166" }, { "step": 6126, "loss": 0.6654537916183472, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.026064" }, { "step": 6127, "loss": 0.616374671459198, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.114040" }, { "step": 6128, "loss": 0.5323957800865173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.218093" }, { "step": 6129, "loss": 0.5260007977485657, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.302839" }, { "step": 6130, "loss": 0.565647304058075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.390069" }, { "step": 6131, "loss": 0.7233959436416626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.501898" }, { "step": 6132, "loss": 0.7969452142715454, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.603588" }, { "step": 6133, "loss": 0.7671277523040771, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.715824" }, { "step": 6134, "loss": 0.5498633980751038, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.805769" }, { "step": 6135, "loss": 0.3354019522666931, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.901781" }, { "step": 6136, "loss": 0.4344443082809448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:25.992881" }, { "step": 6137, "loss": 0.8911557197570801, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.099114" }, { "step": 6138, "loss": 0.6707971096038818, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.214678" }, { "step": 6139, "loss": 0.32634103298187256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.311696" }, { "step": 6140, "loss": 0.554180920124054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.437102" }, { "step": 6141, "loss": 0.8855167627334595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.532275" }, { "step": 6142, "loss": 0.7118990421295166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.641414" }, { "step": 6143, "loss": 0.4467892050743103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.738111" }, { "step": 6144, "loss": 0.4914010763168335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.823459" }, { "step": 6145, "loss": 0.28199493885040283, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:26.918345" }, { "step": 6146, "loss": 0.5531553626060486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.030912" }, { "step": 6147, "loss": 0.8737422227859497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.116259" }, { "step": 6148, "loss": 0.5778127312660217, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.215120" }, { "step": 6149, "loss": 0.3343074917793274, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.312107" }, { "step": 6150, "loss": 0.4841850697994232, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.397093" }, { "step": 6151, "loss": 0.5876168608665466, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.526000" }, { "step": 6152, "loss": 0.7582937479019165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.643911" }, { "step": 6153, "loss": 1.1223987340927124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.735880" }, { "step": 6154, "loss": 0.5786006450653076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.851592" }, { "step": 6155, "loss": 0.6081874370574951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:27.971116" }, { "step": 6156, "loss": 0.4743907153606415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.066488" }, { "step": 6157, "loss": 0.44871988892555237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.166628" }, { "step": 6158, "loss": 0.3820360004901886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.269213" }, { "step": 6159, "loss": 0.49175941944122314, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.355836" }, { "step": 6160, "loss": 0.8096224069595337, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.442617" }, { "step": 6161, "loss": 0.6126245260238647, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.562493" }, { "step": 6162, "loss": 0.5555432438850403, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.654284" }, { "step": 6163, "loss": 0.6888037919998169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.768742" }, { "step": 6164, "loss": 0.3117940127849579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.855117" }, { "step": 6165, "loss": 0.42697927355766296, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:28.941166" }, { "step": 6166, "loss": 0.46788835525512695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.035511" }, { "step": 6167, "loss": 0.4702626168727875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.124947" }, { "step": 6168, "loss": 0.7116363644599915, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.209939" }, { "step": 6169, "loss": 1.1561410427093506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.296030" }, { "step": 6170, "loss": 0.7994515299797058, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.398418" }, { "step": 6171, "loss": 0.5804927945137024, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.499833" }, { "step": 6172, "loss": 0.7676964998245239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.590220" }, { "step": 6173, "loss": 0.5607702732086182, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.677558" }, { "step": 6174, "loss": 0.4281245470046997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.773034" }, { "step": 6175, "loss": 0.5704138278961182, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.900983" }, { "step": 6176, "loss": 0.6126593351364136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:29.985955" }, { "step": 6177, "loss": 0.723376989364624, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.073407" }, { "step": 6178, "loss": 0.5667096972465515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.161006" }, { "step": 6179, "loss": 0.5877907276153564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.256784" }, { "step": 6180, "loss": 0.5821288228034973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.356266" }, { "step": 6181, "loss": 0.3829980492591858, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.448317" }, { "step": 6182, "loss": 0.9123069643974304, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.533949" }, { "step": 6183, "loss": 0.6496587991714478, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.629151" }, { "step": 6184, "loss": 0.5071865916252136, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.722299" }, { "step": 6185, "loss": 0.36144667863845825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.810074" }, { "step": 6186, "loss": 0.4881129562854767, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.902598" }, { "step": 6187, "loss": 0.6624890565872192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:30.995470" }, { "step": 6188, "loss": 0.9368466138839722, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.103428" }, { "step": 6189, "loss": 0.7018129825592041, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.190543" }, { "step": 6190, "loss": 0.7311846017837524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.291590" }, { "step": 6191, "loss": 0.46165144443511963, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.386956" }, { "step": 6192, "loss": 0.4876716136932373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.478871" }, { "step": 6193, "loss": 0.6770554780960083, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.564006" }, { "step": 6194, "loss": 0.44380831718444824, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.649766" }, { "step": 6195, "loss": 0.639247715473175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.761959" }, { "step": 6196, "loss": 0.512298047542572, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.870508" }, { "step": 6197, "loss": 0.8135342597961426, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:31.964777" }, { "step": 6198, "loss": 0.7690884470939636, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.052360" }, { "step": 6199, "loss": 0.710663378238678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.163466" }, { "step": 6200, "loss": 0.42232227325439453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.259563" }, { "step": 6201, "loss": 0.6505785584449768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.352245" }, { "step": 6202, "loss": 0.5738650560379028, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.445593" }, { "step": 6203, "loss": 0.34725049138069153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.534201" }, { "step": 6204, "loss": 0.40421760082244873, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.619369" }, { "step": 6205, "loss": 0.68107670545578, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.709861" }, { "step": 6206, "loss": 0.7288432121276855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.826509" }, { "step": 6207, "loss": 0.5188334584236145, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:32.918573" }, { "step": 6208, "loss": 0.8520140647888184, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.000893" }, { "step": 6209, "loss": 0.48681366443634033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.099997" }, { "step": 6210, "loss": 0.5245826840400696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.194058" }, { "step": 6211, "loss": 0.9201465845108032, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.281439" }, { "step": 6212, "loss": 0.3875106871128082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.376469" }, { "step": 6213, "loss": 0.6894509792327881, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.461889" }, { "step": 6214, "loss": 0.6129262447357178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.572650" }, { "step": 6215, "loss": 0.6622169017791748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.684699" }, { "step": 6216, "loss": 0.4957939386367798, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.779957" }, { "step": 6217, "loss": 0.5606727600097656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.870561" }, { "step": 6218, "loss": 0.3814239501953125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:33.969209" }, { "step": 6219, "loss": 0.5905487537384033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.055543" }, { "step": 6220, "loss": 0.8953887224197388, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.168977" }, { "step": 6221, "loss": 0.6173405051231384, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.254226" }, { "step": 6222, "loss": 0.5596919059753418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.359120" }, { "step": 6223, "loss": 0.5500471591949463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.446680" }, { "step": 6224, "loss": 0.47410470247268677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.535111" }, { "step": 6225, "loss": 0.4437229335308075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.627958" }, { "step": 6226, "loss": 0.7154930830001831, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.719586" }, { "step": 6227, "loss": 0.5827082991600037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.805001" }, { "step": 6228, "loss": 0.5756665468215942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:34.917876" }, { "step": 6229, "loss": 0.4154932200908661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.010640" }, { "step": 6230, "loss": 0.4750278890132904, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.101081" }, { "step": 6231, "loss": 1.011777400970459, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.188184" }, { "step": 6232, "loss": 0.6876579523086548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.281319" }, { "step": 6233, "loss": 0.702106237411499, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.374140" }, { "step": 6234, "loss": 0.6607829332351685, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.462090" }, { "step": 6235, "loss": 0.6730384826660156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.562426" }, { "step": 6236, "loss": 0.6872947216033936, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.669105" }, { "step": 6237, "loss": 0.7261269092559814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.780267" }, { "step": 6238, "loss": 0.4939216375350952, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.871476" }, { "step": 6239, "loss": 0.5133702754974365, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:35.965114" }, { "step": 6240, "loss": 0.6475589275360107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.050601" }, { "step": 6241, "loss": 0.7566269636154175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.147120" }, { "step": 6242, "loss": 0.866095781326294, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.233813" }, { "step": 6243, "loss": 0.6116417646408081, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.327824" }, { "step": 6244, "loss": 0.7208198308944702, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.418144" }, { "step": 6245, "loss": 0.419526606798172, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.504829" }, { "step": 6246, "loss": 0.6186727285385132, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.599828" }, { "step": 6247, "loss": 0.9123624563217163, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.744166" }, { "step": 6248, "loss": 0.6505504846572876, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.841585" }, { "step": 6249, "loss": 0.5360574722290039, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:36.935149" }, { "step": 6250, "loss": 0.6729886531829834, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.046623" }, { "step": 6251, "loss": 0.5086688995361328, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.144636" }, { "step": 6252, "loss": 0.6018866896629333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.229963" }, { "step": 6253, "loss": 0.5599005818367004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.330833" }, { "step": 6254, "loss": 0.7703899145126343, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.417386" }, { "step": 6255, "loss": 0.7988743185997009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.509308" }, { "step": 6256, "loss": 0.5077551603317261, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.607585" }, { "step": 6257, "loss": 0.8151975274085999, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.698354" }, { "step": 6258, "loss": 0.7634936571121216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.785222" }, { "step": 6259, "loss": 1.0715218782424927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.870247" }, { "step": 6260, "loss": 0.5514628887176514, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:37.984517" }, { "step": 6261, "loss": 0.5146123170852661, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.078408" }, { "step": 6262, "loss": 0.5536665916442871, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.174611" }, { "step": 6263, "loss": 0.49443674087524414, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.274270" }, { "step": 6264, "loss": 0.7307000756263733, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.387723" }, { "step": 6265, "loss": 0.7906379699707031, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.472980" }, { "step": 6266, "loss": 0.5734117031097412, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.584650" }, { "step": 6267, "loss": 0.7739447355270386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.696972" }, { "step": 6268, "loss": 0.6820046305656433, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.782246" }, { "step": 6269, "loss": 0.4934352934360504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.869293" }, { "step": 6270, "loss": 0.3127121329307556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:38.961838" }, { "step": 6271, "loss": 0.5429365634918213, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.049908" }, { "step": 6272, "loss": 0.4670722484588623, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.148206" }, { "step": 6273, "loss": 0.6259282827377319, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.241886" }, { "step": 6274, "loss": 0.9748526811599731, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.331330" }, { "step": 6275, "loss": 0.7041574716567993, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.418741" }, { "step": 6276, "loss": 0.4656667113304138, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.514167" }, { "step": 6277, "loss": 0.6378016471862793, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.626769" }, { "step": 6278, "loss": 1.0085783004760742, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.736630" }, { "step": 6279, "loss": 0.3095834255218506, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.831835" }, { "step": 6280, "loss": 0.9392074942588806, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:39.925578" }, { "step": 6281, "loss": 0.5450550317764282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.011864" }, { "step": 6282, "loss": 0.4355108141899109, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.109349" }, { "step": 6283, "loss": 0.9026005268096924, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.194288" }, { "step": 6284, "loss": 0.368243545293808, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.283310" }, { "step": 6285, "loss": 0.28598177433013916, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.372877" }, { "step": 6286, "loss": 0.42897868156433105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.471762" }, { "step": 6287, "loss": 0.43608564138412476, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.564729" }, { "step": 6288, "loss": 0.5065657496452332, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.663352" }, { "step": 6289, "loss": 0.5032735466957092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.762990" }, { "step": 6290, "loss": 0.4838296175003052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.851295" }, { "step": 6291, "loss": 0.3642818331718445, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:40.944003" }, { "step": 6292, "loss": 0.7171934247016907, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.037871" }, { "step": 6293, "loss": 0.9416482448577881, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.129817" }, { "step": 6294, "loss": 0.7996700406074524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.215793" }, { "step": 6295, "loss": 0.5970252752304077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.306505" }, { "step": 6296, "loss": 0.8043294548988342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.419471" }, { "step": 6297, "loss": 0.4546054005622864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.521208" }, { "step": 6298, "loss": 0.6155726313591003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.608782" }, { "step": 6299, "loss": 0.7548624873161316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.697139" }, { "step": 6300, "loss": 0.5953279137611389, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.809758" }, { "step": 6301, "loss": 0.767281711101532, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.902374" }, { "step": 6302, "loss": 0.8012354373931885, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:41.996673" }, { "step": 6303, "loss": 0.5301434993743896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.081294" }, { "step": 6304, "loss": 0.7540048956871033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.194191" }, { "step": 6305, "loss": 0.5523827075958252, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.283714" }, { "step": 6306, "loss": 0.5739606618881226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.368858" }, { "step": 6307, "loss": 0.30282601714134216, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.461939" }, { "step": 6308, "loss": 0.6730145812034607, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.548060" }, { "step": 6309, "loss": 0.6944665908813477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.648083" }, { "step": 6310, "loss": 0.6206762790679932, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.735134" }, { "step": 6311, "loss": 0.6220253705978394, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.821111" }, { "step": 6312, "loss": 0.7077118754386902, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:42.909547" }, { "step": 6313, "loss": 0.5000742673873901, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.009734" }, { "step": 6314, "loss": 0.5229472517967224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.128907" }, { "step": 6315, "loss": 0.6942508816719055, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.216087" }, { "step": 6316, "loss": 0.6792352199554443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.302623" }, { "step": 6317, "loss": 0.6978082656860352, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.388939" }, { "step": 6318, "loss": 0.6732025146484375, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.496903" }, { "step": 6319, "loss": 0.5400512218475342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.592336" }, { "step": 6320, "loss": 0.5309999585151672, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.692838" }, { "step": 6321, "loss": 0.46460145711898804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.784473" }, { "step": 6322, "loss": 0.5035190582275391, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.869287" }, { "step": 6323, "loss": 0.580161988735199, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:43.982418" }, { "step": 6324, "loss": 0.7992140054702759, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.072827" }, { "step": 6325, "loss": 0.5118222236633301, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.164984" }, { "step": 6326, "loss": 0.5756047964096069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.257850" }, { "step": 6327, "loss": 0.4446382224559784, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.350297" }, { "step": 6328, "loss": 0.7451249957084656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.464969" }, { "step": 6329, "loss": 0.4324912428855896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.552736" }, { "step": 6330, "loss": 1.0400350093841553, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.655041" }, { "step": 6331, "loss": 0.9117248058319092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.750915" }, { "step": 6332, "loss": 0.36369311809539795, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.844944" }, { "step": 6333, "loss": 0.6019083857536316, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:44.938589" }, { "step": 6334, "loss": 0.545694887638092, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.035423" }, { "step": 6335, "loss": 0.6171921491622925, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.154230" }, { "step": 6336, "loss": 0.6260440945625305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.238929" }, { "step": 6337, "loss": 0.46121078729629517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.328333" }, { "step": 6338, "loss": 0.5168965458869934, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.427412" }, { "step": 6339, "loss": 0.6688066720962524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.518880" }, { "step": 6340, "loss": 0.441791296005249, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.604130" }, { "step": 6341, "loss": 0.9849148988723755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.713763" }, { "step": 6342, "loss": 0.6957781314849854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.820886" }, { "step": 6343, "loss": 0.33100566267967224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:45.920120" }, { "step": 6344, "loss": 1.0025187730789185, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.036446" }, { "step": 6345, "loss": 0.30764707922935486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.130588" }, { "step": 6346, "loss": 0.8095039129257202, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.235909" }, { "step": 6347, "loss": 0.29954808950424194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.329025" }, { "step": 6348, "loss": 0.7035155296325684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.423722" }, { "step": 6349, "loss": 0.5967724919319153, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.525993" }, { "step": 6350, "loss": 0.5569347143173218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.613568" }, { "step": 6351, "loss": 0.9073099493980408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.699313" }, { "step": 6352, "loss": 0.40581560134887695, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.787148" }, { "step": 6353, "loss": 0.779694676399231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.876738" }, { "step": 6354, "loss": 0.29005149006843567, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:46.968592" }, { "step": 6355, "loss": 0.6681325435638428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.083035" }, { "step": 6356, "loss": 0.6082847714424133, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.200433" }, { "step": 6357, "loss": 0.5362951755523682, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.285731" }, { "step": 6358, "loss": 0.6285179853439331, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.372208" }, { "step": 6359, "loss": 0.5899950265884399, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.456903" }, { "step": 6360, "loss": 0.8882100582122803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.555399" }, { "step": 6361, "loss": 0.867702066898346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.653085" }, { "step": 6362, "loss": 0.6006908416748047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.743662" }, { "step": 6363, "loss": 0.5993177890777588, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.856552" }, { "step": 6364, "loss": 0.5409923791885376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:47.947605" }, { "step": 6365, "loss": 0.43506768345832825, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.039855" }, { "step": 6366, "loss": 0.8319679498672485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.171506" }, { "step": 6367, "loss": 0.9495471715927124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.300959" }, { "step": 6368, "loss": 0.5331530570983887, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.390470" }, { "step": 6369, "loss": 0.649779200553894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.477804" }, { "step": 6370, "loss": 0.9702825546264648, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.569700" }, { "step": 6371, "loss": 0.4172232747077942, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.653754" }, { "step": 6372, "loss": 0.9267650842666626, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.775037" }, { "step": 6373, "loss": 0.4439520835876465, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.861002" }, { "step": 6374, "loss": 0.37958747148513794, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:48.947028" }, { "step": 6375, "loss": 0.767565131187439, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.033880" }, { "step": 6376, "loss": 0.7804242968559265, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.143728" }, { "step": 6377, "loss": 0.7783997058868408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.229047" }, { "step": 6378, "loss": 0.7400903701782227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.342217" }, { "step": 6379, "loss": 0.36445552110671997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.427496" }, { "step": 6380, "loss": 0.5914322733879089, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.513471" }, { "step": 6381, "loss": 1.1309664249420166, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.599514" }, { "step": 6382, "loss": 1.0028142929077148, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.687275" }, { "step": 6383, "loss": 0.46705400943756104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.782760" }, { "step": 6384, "loss": 0.9330031871795654, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.891030" }, { "step": 6385, "loss": 0.570243775844574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:49.983175" }, { "step": 6386, "loss": 0.678217887878418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.070402" }, { "step": 6387, "loss": 0.7642984390258789, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.163847" }, { "step": 6388, "loss": 0.6693288087844849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.276068" }, { "step": 6389, "loss": 0.7267515659332275, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.363240" }, { "step": 6390, "loss": 0.36089998483657837, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.458326" }, { "step": 6391, "loss": 0.7351325154304504, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.543886" }, { "step": 6392, "loss": 0.8005961179733276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.659804" }, { "step": 6393, "loss": 0.5690693259239197, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.746386" }, { "step": 6394, "loss": 0.8868036270141602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.852220" }, { "step": 6395, "loss": 0.5288759469985962, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:50.948615" }, { "step": 6396, "loss": 0.5196219682693481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.041852" }, { "step": 6397, "loss": 0.6087974309921265, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.150057" }, { "step": 6398, "loss": 0.39441558718681335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.239155" }, { "step": 6399, "loss": 1.0404351949691772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.358388" }, { "step": 6400, "loss": 0.6500221490859985, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.444858" }, { "step": 6401, "loss": 0.46609270572662354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.535536" }, { "step": 6402, "loss": 0.6273354291915894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.621540" }, { "step": 6403, "loss": 0.38496536016464233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.713331" }, { "step": 6404, "loss": 0.4694717824459076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.798690" }, { "step": 6405, "loss": 0.8232845664024353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:51.892149" }, { "step": 6406, "loss": 0.5823301672935486, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.018368" }, { "step": 6407, "loss": 0.4932924211025238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.110777" }, { "step": 6408, "loss": 0.8260810375213623, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.220691" }, { "step": 6409, "loss": 0.9444504976272583, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.315229" }, { "step": 6410, "loss": 0.5632715821266174, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.403935" }, { "step": 6411, "loss": 0.5504027605056763, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.495442" }, { "step": 6412, "loss": 0.5552188754081726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.587680" }, { "step": 6413, "loss": 0.7332128286361694, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.692852" }, { "step": 6414, "loss": 0.7946691513061523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.786821" }, { "step": 6415, "loss": 0.37495750188827515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.872842" }, { "step": 6416, "loss": 0.7438879013061523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:52.962669" }, { "step": 6417, "loss": 0.9557035565376282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.048247" }, { "step": 6418, "loss": 0.5316675901412964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.140421" }, { "step": 6419, "loss": 0.8784071207046509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.253341" }, { "step": 6420, "loss": 0.6733697652816772, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.372892" }, { "step": 6421, "loss": 0.44138339161872864, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.473487" }, { "step": 6422, "loss": 0.4413182735443115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.557996" }, { "step": 6423, "loss": 0.5982128381729126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.647978" }, { "step": 6424, "loss": 0.7189118266105652, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.760922" }, { "step": 6425, "loss": 0.567934513092041, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.846099" }, { "step": 6426, "loss": 0.8171558976173401, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:53.957689" }, { "step": 6427, "loss": 1.0058900117874146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.043773" }, { "step": 6428, "loss": 0.5668252110481262, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.133634" }, { "step": 6429, "loss": 0.701871395111084, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.218562" }, { "step": 6430, "loss": 0.5949009656906128, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.307866" }, { "step": 6431, "loss": 0.7582738399505615, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.419744" }, { "step": 6432, "loss": 0.9129679203033447, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.559473" }, { "step": 6433, "loss": 0.6572219729423523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.673946" }, { "step": 6434, "loss": 0.7131524682044983, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.759362" }, { "step": 6435, "loss": 0.7129335403442383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.846017" }, { "step": 6436, "loss": 0.5648126602172852, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:54.942201" }, { "step": 6437, "loss": 0.5731122493743896, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.026370" }, { "step": 6438, "loss": 0.7049902677536011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.126404" }, { "step": 6439, "loss": 0.5838109254837036, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.226423" }, { "step": 6440, "loss": 0.7676843404769897, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.340073" }, { "step": 6441, "loss": 0.7061595916748047, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.425791" }, { "step": 6442, "loss": 0.6178785562515259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.545951" }, { "step": 6443, "loss": 0.7062087059020996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.631205" }, { "step": 6444, "loss": 0.7118951082229614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.748522" }, { "step": 6445, "loss": 0.40215861797332764, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.845154" }, { "step": 6446, "loss": 0.534657895565033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:55.938788" }, { "step": 6447, "loss": 0.5757545232772827, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.030645" }, { "step": 6448, "loss": 0.7902935743331909, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.141353" }, { "step": 6449, "loss": 0.7291362881660461, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.251824" }, { "step": 6450, "loss": 0.7224245071411133, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.363293" }, { "step": 6451, "loss": 0.4519415497779846, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.449918" }, { "step": 6452, "loss": 1.0354665517807007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.562997" }, { "step": 6453, "loss": 0.6760869026184082, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.676847" }, { "step": 6454, "loss": 0.5934470891952515, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.763672" }, { "step": 6455, "loss": 0.8370603322982788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.848701" }, { "step": 6456, "loss": 0.8545504808425903, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:56.933723" }, { "step": 6457, "loss": 0.7890991568565369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.051387" }, { "step": 6458, "loss": 0.43196022510528564, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.154271" }, { "step": 6459, "loss": 0.6366801857948303, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.245918" }, { "step": 6460, "loss": 0.4760149121284485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.331726" }, { "step": 6461, "loss": 0.7560886740684509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.452761" }, { "step": 6462, "loss": 0.6035783290863037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.560720" }, { "step": 6463, "loss": 0.7388036251068115, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.668586" }, { "step": 6464, "loss": 0.46502822637557983, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.782676" }, { "step": 6465, "loss": 0.6074619889259338, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.879249" }, { "step": 6466, "loss": 0.5226253271102905, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:57.975354" }, { "step": 6467, "loss": 0.2697044909000397, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.062291" }, { "step": 6468, "loss": 0.5055438280105591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.155011" }, { "step": 6469, "loss": 0.40285637974739075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.242280" }, { "step": 6470, "loss": 0.5922590494155884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.336286" }, { "step": 6471, "loss": 0.5589722394943237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.431296" }, { "step": 6472, "loss": 0.808468222618103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.524174" }, { "step": 6473, "loss": 0.8804335594177246, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.611463" }, { "step": 6474, "loss": 0.4047338366508484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.696657" }, { "step": 6475, "loss": 0.7406995296478271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.788731" }, { "step": 6476, "loss": 0.5834305286407471, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.873529" }, { "step": 6477, "loss": 0.48559579253196716, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:58.958407" }, { "step": 6478, "loss": 0.49481505155563354, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.051509" }, { "step": 6479, "loss": 0.42955416440963745, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.135588" }, { "step": 6480, "loss": 0.4411671757698059, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.257864" }, { "step": 6481, "loss": 0.35411280393600464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.349701" }, { "step": 6482, "loss": 0.6288315057754517, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.435084" }, { "step": 6483, "loss": 0.4331166446208954, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.519982" }, { "step": 6484, "loss": 0.620365560054779, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.612994" }, { "step": 6485, "loss": 0.5179921388626099, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.705026" }, { "step": 6486, "loss": 0.5572370290756226, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.831519" }, { "step": 6487, "loss": 0.9062818288803101, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:37:59.946553" }, { "step": 6488, "loss": 0.4073321223258972, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.031485" }, { "step": 6489, "loss": 1.3687680959701538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.116243" }, { "step": 6490, "loss": 0.8169151544570923, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.200900" }, { "step": 6491, "loss": 0.5629265904426575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.312895" }, { "step": 6492, "loss": 0.46778005361557007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.405173" }, { "step": 6493, "loss": 0.5748388171195984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.492220" }, { "step": 6494, "loss": 0.7700413465499878, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.609826" }, { "step": 6495, "loss": 0.8548378348350525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.724586" }, { "step": 6496, "loss": 0.7406154870986938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.816302" }, { "step": 6497, "loss": 0.7838739156723022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:00.916243" }, { "step": 6498, "loss": 1.0447347164154053, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:01.002111" }, { "step": 6499, "loss": 0.80810546875, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:01.096123" }, { "step": 6500, "loss": 0.7496809363365173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:01.190059" }, { "step": 6501, "loss": 0.5718775987625122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:23.958679" }, { "step": 6502, "loss": 0.7607216238975525, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.054348" }, { "step": 6503, "loss": 0.7079184055328369, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.152203" }, { "step": 6504, "loss": 0.42673903703689575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.250524" }, { "step": 6505, "loss": 0.5730708241462708, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.346038" }, { "step": 6506, "loss": 0.9207318425178528, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.432254" }, { "step": 6507, "loss": 0.4962609112262726, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.528012" }, { "step": 6508, "loss": 0.5348815321922302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.622435" }, { "step": 6509, "loss": 1.0084362030029297, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.708978" }, { "step": 6510, "loss": 0.7207714319229126, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.802804" }, { "step": 6511, "loss": 0.7057323455810547, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.896474" }, { "step": 6512, "loss": 0.9689807891845703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:24.983397" }, { "step": 6513, "loss": 0.5322166681289673, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.077510" }, { "step": 6514, "loss": 0.4633530378341675, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.170986" }, { "step": 6515, "loss": 0.7246432304382324, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.257174" }, { "step": 6516, "loss": 0.8686330318450928, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.372666" }, { "step": 6517, "loss": 0.6254326105117798, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.458709" }, { "step": 6518, "loss": 0.5828774571418762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.545925" }, { "step": 6519, "loss": 0.7681803703308105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.656041" }, { "step": 6520, "loss": 0.8938332796096802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.763707" }, { "step": 6521, "loss": 0.6462203860282898, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.886586" }, { "step": 6522, "loss": 0.5555833578109741, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:25.974226" }, { "step": 6523, "loss": 0.5278570055961609, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.060215" }, { "step": 6524, "loss": 0.9372580051422119, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.145407" }, { "step": 6525, "loss": 0.6053892374038696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.231230" }, { "step": 6526, "loss": 0.8877164125442505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.345481" }, { "step": 6527, "loss": 0.9300044775009155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.452896" }, { "step": 6528, "loss": 0.38609829545021057, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.552290" }, { "step": 6529, "loss": 0.43732935190200806, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.639219" }, { "step": 6530, "loss": 0.5554901957511902, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.752713" }, { "step": 6531, "loss": 0.8562772274017334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.837772" }, { "step": 6532, "loss": 0.7681955099105835, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:26.928997" }, { "step": 6533, "loss": 0.7113929390907288, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.047142" }, { "step": 6534, "loss": 0.8039495944976807, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.140187" }, { "step": 6535, "loss": 0.9218994379043579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.241800" }, { "step": 6536, "loss": 0.4602271318435669, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.328590" }, { "step": 6537, "loss": 0.4448550343513489, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.423934" }, { "step": 6538, "loss": 0.3331248462200165, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.510872" }, { "step": 6539, "loss": 0.771807074546814, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.622676" }, { "step": 6540, "loss": 0.678192675113678, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.741673" }, { "step": 6541, "loss": 0.5807997584342957, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.833747" }, { "step": 6542, "loss": 0.9314073324203491, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:27.935870" }, { "step": 6543, "loss": 0.9230140447616577, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.086739" }, { "step": 6544, "loss": 0.545911431312561, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.172672" }, { "step": 6545, "loss": 0.6139267683029175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.265509" }, { "step": 6546, "loss": 0.47048330307006836, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.352275" }, { "step": 6547, "loss": 0.7929593920707703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.466701" }, { "step": 6548, "loss": 0.8723453283309937, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.579186" }, { "step": 6549, "loss": 0.4300304651260376, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.672592" }, { "step": 6550, "loss": 0.3975569009780884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.766080" }, { "step": 6551, "loss": 0.7543348073959351, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.851589" }, { "step": 6552, "loss": 0.7509171962738037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:28.942298" }, { "step": 6553, "loss": 0.469180703163147, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.030500" }, { "step": 6554, "loss": 0.7437772750854492, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.115893" }, { "step": 6555, "loss": 0.880293607711792, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.200314" }, { "step": 6556, "loss": 0.5832271575927734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.305873" }, { "step": 6557, "loss": 0.508962094783783, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.395373" }, { "step": 6558, "loss": 0.7911062240600586, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.513635" }, { "step": 6559, "loss": 0.6930934190750122, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.637151" }, { "step": 6560, "loss": 0.6781342029571533, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.722330" }, { "step": 6561, "loss": 0.9125913381576538, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.836172" }, { "step": 6562, "loss": 0.5547957420349121, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:29.921551" }, { "step": 6563, "loss": 0.4035916328430176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.022142" }, { "step": 6564, "loss": 0.7288714051246643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.109453" }, { "step": 6565, "loss": 0.8527460098266602, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.200795" }, { "step": 6566, "loss": 1.051340937614441, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.308387" }, { "step": 6567, "loss": 0.4572821259498596, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.394129" }, { "step": 6568, "loss": 0.5988417267799377, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.517097" }, { "step": 6569, "loss": 0.5102770924568176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.608764" }, { "step": 6570, "loss": 0.5857046246528625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.695691" }, { "step": 6571, "loss": 0.49113160371780396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.785378" }, { "step": 6572, "loss": 0.9141313433647156, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:30.927768" }, { "step": 6573, "loss": 0.8768999576568604, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.046801" }, { "step": 6574, "loss": 0.5414029955863953, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.142453" }, { "step": 6575, "loss": 0.6278074979782104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.240188" }, { "step": 6576, "loss": 0.6105265617370605, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.330758" }, { "step": 6577, "loss": 0.7016572952270508, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.443572" }, { "step": 6578, "loss": 0.40226590633392334, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.537699" }, { "step": 6579, "loss": 0.8068504929542542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.625925" }, { "step": 6580, "loss": 0.3934681713581085, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.718999" }, { "step": 6581, "loss": 0.43979960680007935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.813595" }, { "step": 6582, "loss": 0.3331253230571747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:31.910309" }, { "step": 6583, "loss": 0.4773254692554474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.023138" }, { "step": 6584, "loss": 0.3055501878261566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.115423" }, { "step": 6585, "loss": 0.49924135208129883, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.201588" }, { "step": 6586, "loss": 0.5223972201347351, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.318778" }, { "step": 6587, "loss": 0.9142379760742188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.411859" }, { "step": 6588, "loss": 0.888038694858551, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.507474" }, { "step": 6589, "loss": 0.5524660348892212, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.594214" }, { "step": 6590, "loss": 0.6237573623657227, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.706920" }, { "step": 6591, "loss": 0.5764040946960449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.792235" }, { "step": 6592, "loss": 0.7707505822181702, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.880949" }, { "step": 6593, "loss": 0.7573703527450562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:32.971022" }, { "step": 6594, "loss": 0.4940679669380188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.093627" }, { "step": 6595, "loss": 0.679108738899231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.209895" }, { "step": 6596, "loss": 0.7582385540008545, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.294512" }, { "step": 6597, "loss": 0.4990045428276062, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.383821" }, { "step": 6598, "loss": 0.6289004683494568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.475848" }, { "step": 6599, "loss": 0.4485635757446289, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.565174" }, { "step": 6600, "loss": 0.5954365730285645, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.667398" }, { "step": 6601, "loss": 0.6184263229370117, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.766180" }, { "step": 6602, "loss": 0.7346186637878418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.860790" }, { "step": 6603, "loss": 0.6232471466064453, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:33.947693" }, { "step": 6604, "loss": 0.48909997940063477, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.056355" }, { "step": 6605, "loss": 0.6522293090820312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.141734" }, { "step": 6606, "loss": 0.5881629586219788, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.232117" }, { "step": 6607, "loss": 0.5301710963249207, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.315987" }, { "step": 6608, "loss": 0.6691557168960571, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.405026" }, { "step": 6609, "loss": 0.7894471883773804, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.519849" }, { "step": 6610, "loss": 0.6892940402030945, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.635954" }, { "step": 6611, "loss": 0.865957498550415, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.749558" }, { "step": 6612, "loss": 0.46057644486427307, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.840426" }, { "step": 6613, "loss": 0.43971261382102966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:34.935750" }, { "step": 6614, "loss": 0.4120802879333496, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.032753" }, { "step": 6615, "loss": 0.6206681728363037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.135923" }, { "step": 6616, "loss": 0.6724217534065247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.223612" }, { "step": 6617, "loss": 0.7365994453430176, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.309407" }, { "step": 6618, "loss": 0.7109485864639282, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.394633" }, { "step": 6619, "loss": 0.3324768841266632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.481475" }, { "step": 6620, "loss": 0.30593276023864746, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.567409" }, { "step": 6621, "loss": 0.6922541856765747, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.653354" }, { "step": 6622, "loss": 0.5567560791969299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.738354" }, { "step": 6623, "loss": 0.2916727662086487, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.824333" }, { "step": 6624, "loss": 0.585015594959259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.909414" }, { "step": 6625, "loss": 0.606807291507721, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:35.994495" }, { "step": 6626, "loss": 0.5947337746620178, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.082179" }, { "step": 6627, "loss": 0.8387292623519897, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.197781" }, { "step": 6628, "loss": 0.41898447275161743, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.287451" }, { "step": 6629, "loss": 0.8490936756134033, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.373680" }, { "step": 6630, "loss": 0.4663428068161011, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.461922" }, { "step": 6631, "loss": 0.5857738256454468, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.546207" }, { "step": 6632, "loss": 0.856058657169342, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.632416" }, { "step": 6633, "loss": 0.6666042804718018, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.725507" }, { "step": 6634, "loss": 0.4238922894001007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.812038" }, { "step": 6635, "loss": 0.5705159902572632, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:36.931641" }, { "step": 6636, "loss": 0.6376564502716064, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.019218" }, { "step": 6637, "loss": 0.5498673319816589, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.113822" }, { "step": 6638, "loss": 0.45882272720336914, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.206522" }, { "step": 6639, "loss": 0.515806257724762, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.307221" }, { "step": 6640, "loss": 0.6483088135719299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.400727" }, { "step": 6641, "loss": 0.7616209387779236, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.516103" }, { "step": 6642, "loss": 0.4651957154273987, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.601262" }, { "step": 6643, "loss": 0.5420808792114258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.686658" }, { "step": 6644, "loss": 0.7768049240112305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.781132" }, { "step": 6645, "loss": 0.5113135576248169, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.868685" }, { "step": 6646, "loss": 0.5571600794792175, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:37.956576" }, { "step": 6647, "loss": 0.8856362104415894, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.071609" }, { "step": 6648, "loss": 0.5917225480079651, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.189321" }, { "step": 6649, "loss": 0.7045584917068481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.299354" }, { "step": 6650, "loss": 0.40922269225120544, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.380864" }, { "step": 6651, "loss": 0.496155321598053, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.484736" }, { "step": 6652, "loss": 0.5258066654205322, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.571324" }, { "step": 6653, "loss": 0.5344502925872803, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.655441" }, { "step": 6654, "loss": 0.8345199227333069, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.741225" }, { "step": 6655, "loss": 0.6908277273178101, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.826319" }, { "step": 6656, "loss": 0.9840925931930542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:38.936653" }, { "step": 6657, "loss": 0.37214338779449463, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.026221" }, { "step": 6658, "loss": 0.5742120742797852, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.123336" }, { "step": 6659, "loss": 0.4320451617240906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.210191" }, { "step": 6660, "loss": 0.4155597984790802, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.302586" }, { "step": 6661, "loss": 0.8907472491264343, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.387463" }, { "step": 6662, "loss": 0.6543447971343994, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.502121" }, { "step": 6663, "loss": 0.31323695182800293, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.587745" }, { "step": 6664, "loss": 0.429134726524353, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.676944" }, { "step": 6665, "loss": 0.6166415214538574, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.765411" }, { "step": 6666, "loss": 0.4641582667827606, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.855508" }, { "step": 6667, "loss": 0.69957435131073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:39.981333" }, { "step": 6668, "loss": 0.4187595844268799, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.071387" }, { "step": 6669, "loss": 0.6223825216293335, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.165349" }, { "step": 6670, "loss": 0.7143914103507996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.250172" }, { "step": 6671, "loss": 0.6791791915893555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.337984" }, { "step": 6672, "loss": 0.6428103446960449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.451430" }, { "step": 6673, "loss": 0.6243094205856323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.551648" }, { "step": 6674, "loss": 0.8914873003959656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.637859" }, { "step": 6675, "loss": 0.40760040283203125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.729498" }, { "step": 6676, "loss": 0.5596718788146973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.821623" }, { "step": 6677, "loss": 0.7166602611541748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:40.937009" }, { "step": 6678, "loss": 0.8643742799758911, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.056530" }, { "step": 6679, "loss": 0.8075348138809204, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.173929" }, { "step": 6680, "loss": 0.7232601642608643, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.269112" }, { "step": 6681, "loss": 0.46021169424057007, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.360957" }, { "step": 6682, "loss": 0.8104267716407776, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.446927" }, { "step": 6683, "loss": 0.6819745302200317, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.536069" }, { "step": 6684, "loss": 0.3423475921154022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.637214" }, { "step": 6685, "loss": 0.9860988855361938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.723710" }, { "step": 6686, "loss": 0.6956539750099182, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.828113" }, { "step": 6687, "loss": 0.6977051496505737, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:41.920979" }, { "step": 6688, "loss": 0.4521843194961548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.018592" }, { "step": 6689, "loss": 0.6500400304794312, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.107734" }, { "step": 6690, "loss": 0.9207979440689087, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.195376" }, { "step": 6691, "loss": 0.6412975788116455, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.291662" }, { "step": 6692, "loss": 0.7185558676719666, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.377138" }, { "step": 6693, "loss": 0.6050735712051392, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.463457" }, { "step": 6694, "loss": 0.5302777290344238, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.559609" }, { "step": 6695, "loss": 0.44616663455963135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.680200" }, { "step": 6696, "loss": 0.5498812794685364, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:42.776542" }, { "step": 6697, "loss": 0.6317995190620422, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.077205" }, { "step": 6698, "loss": 0.6782889366149902, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.202574" }, { "step": 6699, "loss": 1.1636031866073608, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.290053" }, { "step": 6700, "loss": 0.718106746673584, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.378695" }, { "step": 6701, "loss": 0.3461427390575409, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.471456" }, { "step": 6702, "loss": 0.5045347213745117, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.557987" }, { "step": 6703, "loss": 0.8542629480361938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.652168" }, { "step": 6704, "loss": 0.8460635542869568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.737941" }, { "step": 6705, "loss": 0.6330617666244507, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.823204" }, { "step": 6706, "loss": 0.6701945662498474, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:43.920966" }, { "step": 6707, "loss": 0.4014117419719696, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.006093" }, { "step": 6708, "loss": 0.7526146769523621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.115729" }, { "step": 6709, "loss": 0.747364342212677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.243795" }, { "step": 6710, "loss": 0.5567092299461365, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.339268" }, { "step": 6711, "loss": 0.6950647234916687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.448660" }, { "step": 6712, "loss": 0.571933388710022, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.540705" }, { "step": 6713, "loss": 0.5117208361625671, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.625902" }, { "step": 6714, "loss": 0.4796123206615448, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.718289" }, { "step": 6715, "loss": 0.6781532168388367, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.815210" }, { "step": 6716, "loss": 0.547346293926239, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:44.912295" }, { "step": 6717, "loss": 0.5925316214561462, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.004580" }, { "step": 6718, "loss": 0.759526789188385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.092128" }, { "step": 6719, "loss": 0.6991141438484192, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.229503" }, { "step": 6720, "loss": 0.6067473292350769, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.320968" }, { "step": 6721, "loss": 0.3891400694847107, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.412196" }, { "step": 6722, "loss": 0.5409058332443237, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.503210" }, { "step": 6723, "loss": 0.5678142309188843, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.595913" }, { "step": 6724, "loss": 0.49560773372650146, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.688255" }, { "step": 6725, "loss": 0.5430762767791748, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.785869" }, { "step": 6726, "loss": 0.598874568939209, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:45.885221" }, { "step": 6727, "loss": 0.5992564558982849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.006588" }, { "step": 6728, "loss": 0.8619440197944641, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.117060" }, { "step": 6729, "loss": 0.7978758811950684, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.202337" }, { "step": 6730, "loss": 0.5606302618980408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.296066" }, { "step": 6731, "loss": 0.7212406396865845, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.384768" }, { "step": 6732, "loss": 0.4957078695297241, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.477144" }, { "step": 6733, "loss": 0.8728170990943909, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.590612" }, { "step": 6734, "loss": 0.5947080850601196, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.713489" }, { "step": 6735, "loss": 0.8181541562080383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.806806" }, { "step": 6736, "loss": 0.6341598033905029, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.906700" }, { "step": 6737, "loss": 0.8492763042449951, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:46.994065" }, { "step": 6738, "loss": 0.4823187589645386, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.086685" }, { "step": 6739, "loss": 0.6176518201828003, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.176027" }, { "step": 6740, "loss": 0.487766832113266, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.263879" }, { "step": 6741, "loss": 0.8121359348297119, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.382685" }, { "step": 6742, "loss": 0.7172603607177734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.468599" }, { "step": 6743, "loss": 0.6658772230148315, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.570916" }, { "step": 6744, "loss": 0.5100440382957458, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.663192" }, { "step": 6745, "loss": 0.30471742153167725, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.749622" }, { "step": 6746, "loss": 0.38799840211868286, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.834979" }, { "step": 6747, "loss": 0.47374269366264343, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:47.928114" }, { "step": 6748, "loss": 0.3574272096157074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.022208" }, { "step": 6749, "loss": 0.30312013626098633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.111753" }, { "step": 6750, "loss": 0.6658865809440613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.203607" }, { "step": 6751, "loss": 0.7208660840988159, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.315428" }, { "step": 6752, "loss": 0.6015994548797607, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.407887" }, { "step": 6753, "loss": 0.7107129693031311, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.495375" }, { "step": 6754, "loss": 0.6377116441726685, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.584848" }, { "step": 6755, "loss": 0.3534013628959656, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.691756" }, { "step": 6756, "loss": 0.501495897769928, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.778103" }, { "step": 6757, "loss": 0.5421551465988159, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.868705" }, { "step": 6758, "loss": 0.6725843548774719, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:48.956530" }, { "step": 6759, "loss": 0.8112684488296509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.091535" }, { "step": 6760, "loss": 0.37435731291770935, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.191051" }, { "step": 6761, "loss": 0.657696545124054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.285538" }, { "step": 6762, "loss": 0.4938851594924927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.371926" }, { "step": 6763, "loss": 0.7952749729156494, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.466128" }, { "step": 6764, "loss": 0.8105409145355225, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.555166" }, { "step": 6765, "loss": 0.6985770463943481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.663826" }, { "step": 6766, "loss": 0.981091320514679, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.748768" }, { "step": 6767, "loss": 0.6178234219551086, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.841461" }, { "step": 6768, "loss": 0.583774745464325, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:49.929058" }, { "step": 6769, "loss": 0.31951016187667847, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.026189" }, { "step": 6770, "loss": 0.5592914819717407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.113775" }, { "step": 6771, "loss": 0.5396174192428589, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.198224" }, { "step": 6772, "loss": 0.6068083047866821, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.303515" }, { "step": 6773, "loss": 0.6999281644821167, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.420316" }, { "step": 6774, "loss": 0.7266169190406799, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.506490" }, { "step": 6775, "loss": 0.7872902154922485, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.602253" }, { "step": 6776, "loss": 0.8609639406204224, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.704600" }, { "step": 6777, "loss": 0.5869332551956177, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.789534" }, { "step": 6778, "loss": 0.6060255765914917, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.882806" }, { "step": 6779, "loss": 0.7994788289070129, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:50.977706" }, { "step": 6780, "loss": 0.6083521246910095, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.073876" }, { "step": 6781, "loss": 0.7665039300918579, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.186854" }, { "step": 6782, "loss": 0.4685409367084503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.271877" }, { "step": 6783, "loss": 0.4758918881416321, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.388935" }, { "step": 6784, "loss": 0.7468501329421997, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.503286" }, { "step": 6785, "loss": 0.7683709263801575, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.591146" }, { "step": 6786, "loss": 0.6121315956115723, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.682921" }, { "step": 6787, "loss": 0.4907922148704529, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.799671" }, { "step": 6788, "loss": 0.5854382514953613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.894001" }, { "step": 6789, "loss": 0.8080897331237793, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:51.986686" }, { "step": 6790, "loss": 0.4253283739089966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.075903" }, { "step": 6791, "loss": 0.7618297338485718, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.188302" }, { "step": 6792, "loss": 0.6328038573265076, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.275569" }, { "step": 6793, "loss": 1.1379683017730713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.368435" }, { "step": 6794, "loss": 0.7771043181419373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.509167" }, { "step": 6795, "loss": 0.51761794090271, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.610543" }, { "step": 6796, "loss": 0.7974687814712524, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.697385" }, { "step": 6797, "loss": 0.8792307376861572, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.783783" }, { "step": 6798, "loss": 0.9878754019737244, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.868363" }, { "step": 6799, "loss": 0.7563262581825256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:52.966017" }, { "step": 6800, "loss": 0.7755602598190308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.051661" }, { "step": 6801, "loss": 0.5006741881370544, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.144969" }, { "step": 6802, "loss": 0.7733948230743408, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.259756" }, { "step": 6803, "loss": 0.5759808421134949, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.383398" }, { "step": 6804, "loss": 0.6906737089157104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.478756" }, { "step": 6805, "loss": 0.8396468162536621, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.586736" }, { "step": 6806, "loss": 0.5500617027282715, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.680547" }, { "step": 6807, "loss": 0.9270985126495361, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.774039" }, { "step": 6808, "loss": 0.5355632305145264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.859179" }, { "step": 6809, "loss": 0.5666714906692505, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:53.956886" }, { "step": 6810, "loss": 0.6107279658317566, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.077186" }, { "step": 6811, "loss": 0.7544845938682556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.165075" }, { "step": 6812, "loss": 0.4071328043937683, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.254576" }, { "step": 6813, "loss": 0.9019603133201599, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.365747" }, { "step": 6814, "loss": 0.6158953905105591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.450276" }, { "step": 6815, "loss": 0.44585561752319336, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.546008" }, { "step": 6816, "loss": 0.6403480768203735, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.653756" }, { "step": 6817, "loss": 0.48908570408821106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.747905" }, { "step": 6818, "loss": 0.6508165597915649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.863058" }, { "step": 6819, "loss": 0.7739638090133667, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:54.972855" }, { "step": 6820, "loss": 1.0654033422470093, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.082338" }, { "step": 6821, "loss": 0.6946656703948975, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.206379" }, { "step": 6822, "loss": 0.6419346928596497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.292249" }, { "step": 6823, "loss": 0.6290754675865173, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.382801" }, { "step": 6824, "loss": 0.48165690898895264, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.500215" }, { "step": 6825, "loss": 0.5832440257072449, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.592959" }, { "step": 6826, "loss": 0.6928609609603882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.735112" }, { "step": 6827, "loss": 0.6064903736114502, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.821334" }, { "step": 6828, "loss": 0.7587820887565613, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:55.936918" }, { "step": 6829, "loss": 0.2910863757133484, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.024448" }, { "step": 6830, "loss": 0.5156704187393188, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.114341" }, { "step": 6831, "loss": 0.5100557208061218, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.243163" }, { "step": 6832, "loss": 0.5705949664115906, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.337368" }, { "step": 6833, "loss": 0.5414872765541077, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.434490" }, { "step": 6834, "loss": 0.6850973963737488, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.520888" }, { "step": 6835, "loss": 0.81004798412323, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.633342" }, { "step": 6836, "loss": 0.9643235206604004, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.729533" }, { "step": 6837, "loss": 0.20582804083824158, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.816080" }, { "step": 6838, "loss": 0.8050634264945984, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:56.909406" }, { "step": 6839, "loss": 0.9491873979568481, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.025461" }, { "step": 6840, "loss": 0.5056011080741882, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.121950" }, { "step": 6841, "loss": 0.6416477560997009, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.220663" }, { "step": 6842, "loss": 0.42013484239578247, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.315000" }, { "step": 6843, "loss": 0.6257138848304749, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.401807" }, { "step": 6844, "loss": 0.407673180103302, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.515585" }, { "step": 6845, "loss": 0.7012489438056946, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.609384" }, { "step": 6846, "loss": 0.6005015969276428, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.700566" }, { "step": 6847, "loss": 0.9138254523277283, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.787136" }, { "step": 6848, "loss": 0.5204735398292542, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.873211" }, { "step": 6849, "loss": 0.7199088335037231, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:57.968384" }, { "step": 6850, "loss": 0.8493281602859497, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.058262" }, { "step": 6851, "loss": 0.4551515579223633, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.155236" }, { "step": 6852, "loss": 0.9794679880142212, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.249362" }, { "step": 6853, "loss": 0.3764224648475647, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.335486" }, { "step": 6854, "loss": 0.99671471118927, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.448384" }, { "step": 6855, "loss": 0.35832345485687256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.544670" }, { "step": 6856, "loss": 0.5067753195762634, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.637330" }, { "step": 6857, "loss": 0.47209447622299194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.730884" }, { "step": 6858, "loss": 0.6024631261825562, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.831798" }, { "step": 6859, "loss": 0.6760612726211548, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:58.916062" }, { "step": 6860, "loss": 0.7265133857727051, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.001858" }, { "step": 6861, "loss": 0.6866716146469116, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.112008" }, { "step": 6862, "loss": 0.43341076374053955, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.205002" }, { "step": 6863, "loss": 0.47807592153549194, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.296814" }, { "step": 6864, "loss": 0.48095476627349854, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.402900" }, { "step": 6865, "loss": 0.5412392616271973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.499360" }, { "step": 6866, "loss": 0.7313829064369202, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.585497" }, { "step": 6867, "loss": 0.841423749923706, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.697498" }, { "step": 6868, "loss": 0.8717652559280396, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.808897" }, { "step": 6869, "loss": 0.42835482954978943, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:38:59.896510" }, { "step": 6870, "loss": 0.5093520879745483, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.014372" }, { "step": 6871, "loss": 0.7005118131637573, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.099199" }, { "step": 6872, "loss": 0.5348836779594421, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.189914" }, { "step": 6873, "loss": 0.9947587251663208, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.299623" }, { "step": 6874, "loss": 0.41653263568878174, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.393196" }, { "step": 6875, "loss": 0.437630295753479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.483988" }, { "step": 6876, "loss": 0.44259387254714966, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.572038" }, { "step": 6877, "loss": 0.23386317491531372, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.660288" }, { "step": 6878, "loss": 0.43437859416007996, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.752953" }, { "step": 6879, "loss": 0.6720832586288452, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.841299" }, { "step": 6880, "loss": 0.43835678696632385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:00.926098" }, { "step": 6881, "loss": 0.5749750733375549, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.019299" }, { "step": 6882, "loss": 0.6695635318756104, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.105400" }, { "step": 6883, "loss": 0.7261829376220703, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.210709" }, { "step": 6884, "loss": 0.6921046376228333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.304320" }, { "step": 6885, "loss": 0.5403764247894287, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.421707" }, { "step": 6886, "loss": 0.4782467484474182, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.512360" }, { "step": 6887, "loss": 0.712188720703125, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.600956" }, { "step": 6888, "loss": 0.9888303279876709, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.696697" }, { "step": 6889, "loss": 0.7189310789108276, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.814438" }, { "step": 6890, "loss": 0.6314557194709778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.901048" }, { "step": 6891, "loss": 0.45192089676856995, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:01.986558" }, { "step": 6892, "loss": 0.961949348449707, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.110551" }, { "step": 6893, "loss": 0.6637616157531738, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.210790" }, { "step": 6894, "loss": 0.783012330532074, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.319441" }, { "step": 6895, "loss": 0.6553168296813965, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.433796" }, { "step": 6896, "loss": 0.5242806077003479, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.520390" }, { "step": 6897, "loss": 0.4507027864456177, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.605000" }, { "step": 6898, "loss": 0.6536660194396973, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.723656" }, { "step": 6899, "loss": 0.4698128402233124, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.816274" }, { "step": 6900, "loss": 0.6222271919250488, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:02.911209" }, { "step": 6901, "loss": 0.5546128153800964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.003735" }, { "step": 6902, "loss": 0.8181421756744385, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.095612" }, { "step": 6903, "loss": 0.38301247358322144, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.188530" }, { "step": 6904, "loss": 0.5332808494567871, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.274842" }, { "step": 6905, "loss": 0.7438290119171143, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.386471" }, { "step": 6906, "loss": 0.8387271165847778, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.502460" }, { "step": 6907, "loss": 0.7787265181541443, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.626375" }, { "step": 6908, "loss": 0.7139887809753418, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.737022" }, { "step": 6909, "loss": 0.6195221543312073, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.820532" }, { "step": 6910, "loss": 0.7482712268829346, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.905949" }, { "step": 6911, "loss": 0.4392249584197998, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:03.999070" }, { "step": 6912, "loss": 0.5536802411079407, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.089358" }, { "step": 6913, "loss": 0.43277546763420105, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.179426" }, { "step": 6914, "loss": 0.5472291111946106, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.292927" }, { "step": 6915, "loss": 0.44490766525268555, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.378107" }, { "step": 6916, "loss": 0.8250951170921326, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.471807" }, { "step": 6917, "loss": 0.677784264087677, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.557158" }, { "step": 6918, "loss": 0.5644082427024841, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.642902" }, { "step": 6919, "loss": 0.8220864534378052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.750221" }, { "step": 6920, "loss": 0.7244866490364075, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.835855" }, { "step": 6921, "loss": 1.007920503616333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:04.921335" }, { "step": 6922, "loss": 0.5564972758293152, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.013053" }, { "step": 6923, "loss": 0.6958287954330444, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.098516" }, { "step": 6924, "loss": 0.6524324417114258, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.184837" }, { "step": 6925, "loss": 0.5092162489891052, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.279448" }, { "step": 6926, "loss": 0.7857630252838135, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.364558" }, { "step": 6927, "loss": 0.5559995174407959, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.453275" }, { "step": 6928, "loss": 0.602280855178833, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.569199" }, { "step": 6929, "loss": 0.9243791103363037, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.697739" }, { "step": 6930, "loss": 0.9297240972518921, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.792619" }, { "step": 6931, "loss": 0.8085651397705078, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.877321" }, { "step": 6932, "loss": 0.6292772889137268, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:05.966778" }, { "step": 6933, "loss": 0.6640976071357727, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.059509" }, { "step": 6934, "loss": 0.6500469446182251, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.144404" }, { "step": 6935, "loss": 0.46345585584640503, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.239898" }, { "step": 6936, "loss": 0.25332626700401306, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.325247" }, { "step": 6937, "loss": 0.3751096725463867, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.419904" }, { "step": 6938, "loss": 0.5771223306655884, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.508587" }, { "step": 6939, "loss": 0.5566922426223755, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.617603" }, { "step": 6940, "loss": 0.7247473001480103, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.734868" }, { "step": 6941, "loss": 0.48601388931274414, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.821610" }, { "step": 6942, "loss": 0.4496524930000305, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.913020" }, { "step": 6943, "loss": 0.5418603420257568, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:06.999586" }, { "step": 6944, "loss": 0.926906943321228, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.084719" }, { "step": 6945, "loss": 0.7740631103515625, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.171738" }, { "step": 6946, "loss": 0.9168674945831299, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.261973" }, { "step": 6947, "loss": 0.6573238372802734, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.379172" }, { "step": 6948, "loss": 0.8977750539779663, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.499577" }, { "step": 6949, "loss": 0.6804958581924438, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.590977" }, { "step": 6950, "loss": 0.6822401285171509, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.700134" }, { "step": 6951, "loss": 0.8548394441604614, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.807833" }, { "step": 6952, "loss": 0.5717246532440186, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.894599" }, { "step": 6953, "loss": 0.6103857159614563, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:07.989255" }, { "step": 6954, "loss": 0.7126290798187256, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.082017" }, { "step": 6955, "loss": 0.8495997190475464, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.197484" }, { "step": 6956, "loss": 0.5812974572181702, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.283449" }, { "step": 6957, "loss": 0.5835901498794556, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.367690" }, { "step": 6958, "loss": 0.9904699325561523, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.482714" }, { "step": 6959, "loss": 0.6711432933807373, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.568299" }, { "step": 6960, "loss": 0.5488845705986023, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.654358" }, { "step": 6961, "loss": 0.6549355983734131, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.738935" }, { "step": 6962, "loss": 0.47686678171157837, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.831925" }, { "step": 6963, "loss": 0.40524905920028687, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:08.923755" }, { "step": 6964, "loss": 0.5194750428199768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.017103" }, { "step": 6965, "loss": 0.5016157627105713, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.104779" }, { "step": 6966, "loss": 0.7500213384628296, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.191891" }, { "step": 6967, "loss": 0.37444543838500977, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.287311" }, { "step": 6968, "loss": 0.4879606068134308, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.405169" }, { "step": 6969, "loss": 0.7835171222686768, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.501108" }, { "step": 6970, "loss": 0.6992994546890259, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.609084" }, { "step": 6971, "loss": 0.6032155156135559, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.709257" }, { "step": 6972, "loss": 0.7534776926040649, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.795467" }, { "step": 6973, "loss": 0.6982911825180054, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.880875" }, { "step": 6974, "loss": 0.5659118890762329, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:09.999851" }, { "step": 6975, "loss": 0.8804717063903809, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.093555" }, { "step": 6976, "loss": 0.6392108201980591, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.205046" }, { "step": 6977, "loss": 0.715478777885437, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.290756" }, { "step": 6978, "loss": 0.7723619937896729, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.410097" }, { "step": 6979, "loss": 0.6036839485168457, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.502378" }, { "step": 6980, "loss": 0.7092404961585999, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.588843" }, { "step": 6981, "loss": 0.6073147058486938, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.679448" }, { "step": 6982, "loss": 0.7599751353263855, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.797341" }, { "step": 6983, "loss": 0.8296031355857849, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.892221" }, { "step": 6984, "loss": 0.5406829714775085, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:10.978100" }, { "step": 6985, "loss": 0.7025588750839233, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.068020" }, { "step": 6986, "loss": 0.6267930269241333, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.153179" }, { "step": 6987, "loss": 0.65400230884552, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.265610" }, { "step": 6988, "loss": 0.30865371227264404, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.361577" }, { "step": 6989, "loss": 0.8727535009384155, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.474752" }, { "step": 6990, "loss": 0.46724432706832886, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.564622" }, { "step": 6991, "loss": 0.8466984033584595, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.684539" }, { "step": 6992, "loss": 0.5381495356559753, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.769154" }, { "step": 6993, "loss": 0.7211875915527344, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.862585" }, { "step": 6994, "loss": 0.8195438385009766, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:11.952530" }, { "step": 6995, "loss": 0.9256563186645508, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:12.066517" }, { "step": 6996, "loss": 0.7245627641677856, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:12.177834" }, { "step": 6997, "loss": 0.7383286356925964, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:12.263177" }, { "step": 6998, "loss": 0.6589103937149048, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:12.376471" }, { "step": 6999, "loss": 0.4397381842136383, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:12.468167" }, { "step": 7000, "loss": 0.6192573308944702, "learning_rate": 1e-05, "timestamp": "2025-08-18T20:39:12.568436" } ], "evaluation_history": [ { "step": 0, "checkpoint_type": "pre_training", "timestamp": "2025-08-18T20:22:59.760401", "loss": 1.2974295389652253, "perplexity": 3.659877061843872, "min_loss": 0.9512767791748047, "max_loss": 1.703115463256836, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.27680277119292407, "avg_word_accuracy": 0.11646049990689945, "avg_edit_distance": 33.17, "avg_normalized_edit_distance": 0.7231972288070756, "avg_length_ratio": 0.9951391574082407, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.034482758620689655, "edit_distance": 28, "normalized_edit_distance": 0.9655172413793104, "word_accuracy": 0.0, "length_ratio": 2.9, "predicted_length": 29, "ground_truth_length": 10 }, { "character_accuracy": 0.6226415094339622, "edit_distance": 20, "normalized_edit_distance": 0.37735849056603776, "word_accuracy": 0.25, "length_ratio": 0.7358490566037735, "predicted_length": 39, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 2, "ground_truth_length": 5 }, { "character_accuracy": 0.2803030303030303, "edit_distance": 95, "normalized_edit_distance": 0.7196969696969697, "word_accuracy": 0.13793103448275862, "length_ratio": 1.5348837209302326, "predicted_length": 132, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.34375, "edit_distance": 42, "normalized_edit_distance": 0.65625, "word_accuracy": 0.0, "length_ratio": 1.1636363636363636, "predicted_length": 64, "ground_truth_length": 55 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 15, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 2.5714285714285716, "predicted_length": 18, "ground_truth_length": 7 }, { "character_accuracy": 0.11904761904761904, "edit_distance": 37, "normalized_edit_distance": 0.8809523809523809, "word_accuracy": 0.0, "length_ratio": 0.6190476190476191, "predicted_length": 26, "ground_truth_length": 42 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 19, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3684210526315789, "predicted_length": 7, "ground_truth_length": 19 }, { "character_accuracy": 0.058823529411764705, "edit_distance": 16, "normalized_edit_distance": 0.9411764705882353, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7435897435897436, "edit_distance": 10, "normalized_edit_distance": 0.2564102564102564, "word_accuracy": 0.4444444444444444, "length_ratio": 0.8461538461538461, "predicted_length": 33, "ground_truth_length": 39 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 6, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 18, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.4166666666666667, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.29545454545454547, "edit_distance": 31, "normalized_edit_distance": 0.7045454545454546, "word_accuracy": 0.1111111111111111, "length_ratio": 0.7045454545454546, "predicted_length": 31, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 55, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.18181818181818182, "predicted_length": 10, "ground_truth_length": 55 }, { "character_accuracy": 0.265625, "edit_distance": 47, "normalized_edit_distance": 0.734375, "word_accuracy": 0.0, "length_ratio": 1.3333333333333333, "predicted_length": 64, "ground_truth_length": 48 }, { "character_accuracy": 0.8867924528301887, "edit_distance": 6, "normalized_edit_distance": 0.11320754716981132, "word_accuracy": 0.5384615384615384, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.5405405405405406, "edit_distance": 17, "normalized_edit_distance": 0.4594594594594595, "word_accuracy": 0.2857142857142857, "length_ratio": 0.7027027027027027, "predicted_length": 26, "ground_truth_length": 37 }, { "character_accuracy": 0.0, "edit_distance": 58, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1896551724137931, "predicted_length": 11, "ground_truth_length": 58 }, { "character_accuracy": 0.045454545454545456, "edit_distance": 42, "normalized_edit_distance": 0.9545454545454546, "word_accuracy": 0.0, "length_ratio": 0.20454545454545456, "predicted_length": 9, "ground_truth_length": 44 }, { "character_accuracy": 0.030303030303030304, "edit_distance": 32, "normalized_edit_distance": 0.9696969696969697, "word_accuracy": 0.0, "length_ratio": 0.30303030303030304, "predicted_length": 10, "ground_truth_length": 33 }, { "character_accuracy": 0.20689655172413793, "edit_distance": 46, "normalized_edit_distance": 0.7931034482758621, "word_accuracy": 0.0, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5384615384615384, "edit_distance": 18, "normalized_edit_distance": 0.46153846153846156, "word_accuracy": 0.1111111111111111, "length_ratio": 0.717948717948718, "predicted_length": 28, "ground_truth_length": 39 }, { "character_accuracy": 0.23809523809523808, "edit_distance": 32, "normalized_edit_distance": 0.7619047619047619, "word_accuracy": 0.0, "length_ratio": 0.8095238095238095, "predicted_length": 34, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.872093023255814, "edit_distance": 11, "normalized_edit_distance": 0.12790697674418605, "word_accuracy": 0.6428571428571429, "length_ratio": 0.9418604651162791, "predicted_length": 81, "ground_truth_length": 86 }, { "character_accuracy": 0.7789473684210526, "edit_distance": 21, "normalized_edit_distance": 0.22105263157894736, "word_accuracy": 0.7333333333333333, "length_ratio": 0.8315789473684211, "predicted_length": 79, "ground_truth_length": 95 }, { "character_accuracy": 0.8974358974358975, "edit_distance": 4, "normalized_edit_distance": 0.10256410256410256, "word_accuracy": 0.75, "length_ratio": 0.8974358974358975, "predicted_length": 35, "ground_truth_length": 39 }, { "character_accuracy": 0.26804123711340205, "edit_distance": 71, "normalized_edit_distance": 0.7319587628865979, "word_accuracy": 0.0, "length_ratio": 1.4264705882352942, "predicted_length": 97, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.0, "edit_distance": 14, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.21428571428571427, "predicted_length": 3, "ground_truth_length": 14 }, { "character_accuracy": 0.1702127659574468, "edit_distance": 39, "normalized_edit_distance": 0.8297872340425532, "word_accuracy": 0.0, "length_ratio": 1.46875, "predicted_length": 47, "ground_truth_length": 32 }, { "character_accuracy": 0.1702127659574468, "edit_distance": 39, "normalized_edit_distance": 0.8297872340425532, "word_accuracy": 0.0, "length_ratio": 0.8297872340425532, "predicted_length": 39, "ground_truth_length": 47 }, { "character_accuracy": 0.234375, "edit_distance": 49, "normalized_edit_distance": 0.765625, "word_accuracy": 0.058823529411764705, "length_ratio": 1.3061224489795917, "predicted_length": 64, "ground_truth_length": 49 }, { "character_accuracy": 0.20967741935483872, "edit_distance": 147, "normalized_edit_distance": 0.7903225806451613, "word_accuracy": 0.0, "length_ratio": 1.9578947368421054, "predicted_length": 186, "ground_truth_length": 95 }, { "character_accuracy": 0.20207253886010362, "edit_distance": 154, "normalized_edit_distance": 0.7979274611398963, "word_accuracy": 0.0, "length_ratio": 1.969387755102041, "predicted_length": 193, "ground_truth_length": 98 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 6, "ground_truth_length": 10 }, { "character_accuracy": 0.4024390243902439, "edit_distance": 49, "normalized_edit_distance": 0.5975609756097561, "word_accuracy": 0.0625, "length_ratio": 0.9634146341463414, "predicted_length": 79, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.1956521739130435, "edit_distance": 37, "normalized_edit_distance": 0.8043478260869565, "word_accuracy": 0.0, "length_ratio": 2.090909090909091, "predicted_length": 46, "ground_truth_length": 22 }, { "character_accuracy": 0.19444444444444445, "edit_distance": 29, "normalized_edit_distance": 0.8055555555555556, "word_accuracy": 0.0, "length_ratio": 0.4722222222222222, "predicted_length": 17, "ground_truth_length": 36 }, { "character_accuracy": 0.7954545454545454, "edit_distance": 9, "normalized_edit_distance": 0.20454545454545456, "word_accuracy": 0.5555555555555556, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.4375, "edit_distance": 36, "normalized_edit_distance": 0.5625, "word_accuracy": 0.0, "length_ratio": 0.96875, "predicted_length": 62, "ground_truth_length": 64 }, { "character_accuracy": 0.23469387755102042, "edit_distance": 150, "normalized_edit_distance": 0.7653061224489796, "word_accuracy": 0.0, "length_ratio": 2.0631578947368423, "predicted_length": 196, "ground_truth_length": 95 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.125, "length_ratio": 0.6216216216216216, "predicted_length": 23, "ground_truth_length": 37 }, { "character_accuracy": 0.13793103448275862, "edit_distance": 50, "normalized_edit_distance": 0.8620689655172413, "word_accuracy": 0.0, "length_ratio": 0.9655172413793104, "predicted_length": 56, "ground_truth_length": 58 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 38, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.5681818181818182, "predicted_length": 25, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.72, "edit_distance": 14, "normalized_edit_distance": 0.28, "word_accuracy": 0.6, "length_ratio": 0.84, "predicted_length": 42, "ground_truth_length": 50 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 12, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.2857142857142857, "length_ratio": 0.7941176470588235, "predicted_length": 27, "ground_truth_length": 34 }, { "character_accuracy": 0.0, "edit_distance": 60, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.23333333333333334, "predicted_length": 14, "ground_truth_length": 60 }, { "character_accuracy": 0.23076923076923078, "edit_distance": 70, "normalized_edit_distance": 0.7692307692307693, "word_accuracy": 0.0, "length_ratio": 1.6851851851851851, "predicted_length": 91, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 13, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 2.6, "predicted_length": 13, "ground_truth_length": 5 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 4, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.2561576354679803, "edit_distance": 151, "normalized_edit_distance": 0.7438423645320197, "word_accuracy": 0.0, "length_ratio": 2.0927835051546393, "predicted_length": 203, "ground_truth_length": 97 }, { "character_accuracy": 0.12244897959183673, "edit_distance": 43, "normalized_edit_distance": 0.8775510204081632, "word_accuracy": 0.0, "length_ratio": 4.454545454545454, "predicted_length": 49, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.1891891891891892, "edit_distance": 30, "normalized_edit_distance": 0.8108108108108109, "word_accuracy": 0.0, "length_ratio": 1.6818181818181819, "predicted_length": 37, "ground_truth_length": 22 }, { "character_accuracy": 0.0, "edit_distance": 55, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.23636363636363636, "predicted_length": 13, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 4, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 6, "ground_truth_length": 6 }, { "character_accuracy": 0.26666666666666666, "edit_distance": 11, "normalized_edit_distance": 0.7333333333333333, "word_accuracy": 0.0, "length_ratio": 0.5333333333333333, "predicted_length": 8, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.0, "edit_distance": 55, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2909090909090909, "predicted_length": 16, "ground_truth_length": 55 }, { "character_accuracy": 0.03125, "edit_distance": 31, "normalized_edit_distance": 0.96875, "word_accuracy": 0.0, "length_ratio": 6.4, "predicted_length": 32, "ground_truth_length": 5 }, { "character_accuracy": 0.625, "edit_distance": 42, "normalized_edit_distance": 0.375, "word_accuracy": 0.5454545454545454, "length_ratio": 0.6607142857142857, "predicted_length": 74, "ground_truth_length": 112 }, { "character_accuracy": 0.11538461538461539, "edit_distance": 46, "normalized_edit_distance": 0.8846153846153846, "word_accuracy": 0.0, "length_ratio": 1.0833333333333333, "predicted_length": 52, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.2602739726027397, "edit_distance": 54, "normalized_edit_distance": 0.7397260273972602, "word_accuracy": 0.0, "length_ratio": 1.6222222222222222, "predicted_length": 73, "ground_truth_length": 45 }, { "character_accuracy": 0.24444444444444444, "edit_distance": 68, "normalized_edit_distance": 0.7555555555555555, "word_accuracy": 0.0, "length_ratio": 1.8, "predicted_length": 90, "ground_truth_length": 50 }, { "character_accuracy": 0.2857142857142857, "edit_distance": 5, "normalized_edit_distance": 0.7142857142857143, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.22123893805309736, "edit_distance": 88, "normalized_edit_distance": 0.7787610619469026, "word_accuracy": 0.0, "length_ratio": 1.2417582417582418, "predicted_length": 113, "ground_truth_length": 91 }, { "character_accuracy": 0.1724137931034483, "edit_distance": 24, "normalized_edit_distance": 0.8275862068965517, "word_accuracy": 0.0, "length_ratio": 1.7058823529411764, "predicted_length": 29, "ground_truth_length": 17 }, { "character_accuracy": 0.65, "edit_distance": 14, "normalized_edit_distance": 0.35, "word_accuracy": 0.5714285714285714, "length_ratio": 0.675, "predicted_length": 27, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 4, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.3333333333333333, "predicted_length": 4, "ground_truth_length": 3 }, { "character_accuracy": 0.2346368715083799, "edit_distance": 137, "normalized_edit_distance": 0.7653631284916201, "word_accuracy": 0.0, "length_ratio": 1.7211538461538463, "predicted_length": 179, "ground_truth_length": 104 }, { "character_accuracy": 0.22839506172839505, "edit_distance": 125, "normalized_edit_distance": 0.7716049382716049, "word_accuracy": 0.0, "length_ratio": 1.6875, "predicted_length": 162, "ground_truth_length": 96 }, { "character_accuracy": 0.47619047619047616, "edit_distance": 22, "normalized_edit_distance": 0.5238095238095238, "word_accuracy": 0.15384615384615385, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 44, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 10, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 26, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3076923076923077, "predicted_length": 8, "ground_truth_length": 26 }, { "character_accuracy": 0.16, "edit_distance": 21, "normalized_edit_distance": 0.84, "word_accuracy": 0.0, "length_ratio": 1.5625, "predicted_length": 25, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.6440677966101694, "edit_distance": 21, "normalized_edit_distance": 0.3559322033898305, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6949152542372882, "predicted_length": 41, "ground_truth_length": 59 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.5151515151515151, "predicted_length": 17, "ground_truth_length": 33 }, { "character_accuracy": 0.23636363636363636, "edit_distance": 42, "normalized_edit_distance": 0.7636363636363637, "word_accuracy": 0.05555555555555555, "length_ratio": 1.0377358490566038, "predicted_length": 55, "ground_truth_length": 53 }, { "character_accuracy": 0.8688524590163934, "edit_distance": 8, "normalized_edit_distance": 0.13114754098360656, "word_accuracy": 0.6, "length_ratio": 0.9672131147540983, "predicted_length": 59, "ground_truth_length": 61 } ] }, { "step": 500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:24:07.146625", "loss": 0.9453990042209626, "perplexity": 2.5738401412963867, "min_loss": 0.5728509426116943, "max_loss": 1.5241628885269165, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.3944614812685853, "avg_word_accuracy": 0.19857796220663862, "avg_edit_distance": 23.71, "avg_normalized_edit_distance": 0.6055385187314148, "avg_length_ratio": 0.7605503585194653, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.5, "edit_distance": 5, "normalized_edit_distance": 0.5, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.2830188679245283, "edit_distance": 38, "normalized_edit_distance": 0.7169811320754716, "word_accuracy": 0.0, "length_ratio": 0.7169811320754716, "predicted_length": 38, "ground_truth_length": 53 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.29292929292929293, "edit_distance": 70, "normalized_edit_distance": 0.7070707070707071, "word_accuracy": 0.037037037037037035, "length_ratio": 1.1511627906976745, "predicted_length": 99, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.7636363636363637, "edit_distance": 13, "normalized_edit_distance": 0.23636363636363636, "word_accuracy": 0.5, "length_ratio": 0.8545454545454545, "predicted_length": 47, "ground_truth_length": 55 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 6, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 14, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.14285714285714285, "length_ratio": 0.7619047619047619, "predicted_length": 32, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.25, "edit_distance": 15, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 1.0526315789473684, "predicted_length": 20, "ground_truth_length": 19 }, { "character_accuracy": 0.058823529411764705, "edit_distance": 16, "normalized_edit_distance": 0.9411764705882353, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 6, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 18, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.6, "length_ratio": 0.7450980392156863, "predicted_length": 38, "ground_truth_length": 51 }, { "character_accuracy": 0.4090909090909091, "edit_distance": 26, "normalized_edit_distance": 0.5909090909090909, "word_accuracy": 0.1111111111111111, "length_ratio": 0.6136363636363636, "predicted_length": 27, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.3, "edit_distance": 7, "normalized_edit_distance": 0.7, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.3541666666666667, "edit_distance": 31, "normalized_edit_distance": 0.6458333333333334, "word_accuracy": 0.4, "length_ratio": 0.5625, "predicted_length": 27, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.24324324324324326, "edit_distance": 28, "normalized_edit_distance": 0.7567567567567568, "word_accuracy": 0.25, "length_ratio": 0.7837837837837838, "predicted_length": 29, "ground_truth_length": 37 }, { "character_accuracy": 0.6896551724137931, "edit_distance": 18, "normalized_edit_distance": 0.3103448275862069, "word_accuracy": 0.25, "length_ratio": 0.8448275862068966, "predicted_length": 49, "ground_truth_length": 58 }, { "character_accuracy": 0.4090909090909091, "edit_distance": 26, "normalized_edit_distance": 0.5909090909090909, "word_accuracy": 0.1111111111111111, "length_ratio": 0.5227272727272727, "predicted_length": 23, "ground_truth_length": 44 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 6, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.1, "length_ratio": 0.8787878787878788, "predicted_length": 29, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.8125, "edit_distance": 9, "normalized_edit_distance": 0.1875, "word_accuracy": 0.375, "length_ratio": 0.8958333333333334, "predicted_length": 43, "ground_truth_length": 48 }, { "character_accuracy": 0.38461538461538464, "edit_distance": 24, "normalized_edit_distance": 0.6153846153846154, "word_accuracy": 0.0, "length_ratio": 0.5384615384615384, "predicted_length": 21, "ground_truth_length": 39 }, { "character_accuracy": 0.11904761904761904, "edit_distance": 37, "normalized_edit_distance": 0.8809523809523809, "word_accuracy": 0.0, "length_ratio": 0.40476190476190477, "predicted_length": 17, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.281767955801105, "edit_distance": 130, "normalized_edit_distance": 0.7182320441988951, "word_accuracy": 0.05128205128205128, "length_ratio": 2.104651162790698, "predicted_length": 181, "ground_truth_length": 86 }, { "character_accuracy": 0.3473684210526316, "edit_distance": 62, "normalized_edit_distance": 0.6526315789473685, "word_accuracy": 0.4117647058823529, "length_ratio": 0.9263157894736842, "predicted_length": 88, "ground_truth_length": 95 }, { "character_accuracy": 0.5128205128205128, "edit_distance": 19, "normalized_edit_distance": 0.48717948717948717, "word_accuracy": 0.3, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 12, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 7, "ground_truth_length": 14 }, { "character_accuracy": 0.22857142857142856, "edit_distance": 27, "normalized_edit_distance": 0.7714285714285715, "word_accuracy": 0.0, "length_ratio": 1.09375, "predicted_length": 35, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.8979591836734694, "edit_distance": 5, "normalized_edit_distance": 0.10204081632653061, "word_accuracy": 0.6, "length_ratio": 1.0, "predicted_length": 49, "ground_truth_length": 49 }, { "character_accuracy": 0.9157894736842105, "edit_distance": 8, "normalized_edit_distance": 0.08421052631578947, "word_accuracy": 0.7857142857142857, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.16326530612244897, "edit_distance": 82, "normalized_edit_distance": 0.8367346938775511, "word_accuracy": 0.0, "length_ratio": 0.9897959183673469, "predicted_length": 97, "ground_truth_length": 98 }, { "character_accuracy": 0.4, "edit_distance": 6, "normalized_edit_distance": 0.6, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1, "edit_distance": 18, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.3, "predicted_length": 6, "ground_truth_length": 20 }, { "character_accuracy": 0.23529411764705882, "edit_distance": 26, "normalized_edit_distance": 0.7647058823529411, "word_accuracy": 0.07692307692307693, "length_ratio": 1.5454545454545454, "predicted_length": 34, "ground_truth_length": 22 }, { "character_accuracy": 0.05555555555555555, "edit_distance": 34, "normalized_edit_distance": 0.9444444444444444, "word_accuracy": 0.0, "length_ratio": 0.2222222222222222, "predicted_length": 8, "ground_truth_length": 36 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5555555555555556, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.65625, "edit_distance": 22, "normalized_edit_distance": 0.34375, "word_accuracy": 0.5, "length_ratio": 0.71875, "predicted_length": 46, "ground_truth_length": 64 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 75, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 95, "ground_truth_length": 95 }, { "character_accuracy": 0.2702702702702703, "edit_distance": 27, "normalized_edit_distance": 0.7297297297297297, "word_accuracy": 0.14285714285714285, "length_ratio": 0.5405405405405406, "predicted_length": 20, "ground_truth_length": 37 }, { "character_accuracy": 0.5517241379310345, "edit_distance": 26, "normalized_edit_distance": 0.4482758620689655, "word_accuracy": 0.375, "length_ratio": 0.7241379310344828, "predicted_length": 42, "ground_truth_length": 58 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 38, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.5681818181818182, "predicted_length": 25, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.72, "edit_distance": 14, "normalized_edit_distance": 0.28, "word_accuracy": 0.6, "length_ratio": 0.84, "predicted_length": 42, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.42857142857142855, "length_ratio": 0.7941176470588235, "predicted_length": 27, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 6, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.7272727272727273, "length_ratio": 0.9629629629629629, "predicted_length": 52, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 5, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.3, "edit_distance": 14, "normalized_edit_distance": 0.7, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 12, "ground_truth_length": 20 }, { "character_accuracy": 0.2571428571428571, "edit_distance": 156, "normalized_edit_distance": 0.7428571428571429, "word_accuracy": 0.0, "length_ratio": 2.1649484536082473, "predicted_length": 210, "ground_truth_length": 97 }, { "character_accuracy": 0.36363636363636365, "edit_distance": 7, "normalized_edit_distance": 0.6363636363636364, "word_accuracy": 0.0, "length_ratio": 0.8181818181818182, "predicted_length": 9, "ground_truth_length": 11 }, { "character_accuracy": 0.22580645161290322, "edit_distance": 96, "normalized_edit_distance": 0.7741935483870968, "word_accuracy": 0.2, "length_ratio": 1.2783505154639174, "predicted_length": 124, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 19, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.16666666666666666, "length_ratio": 0.5909090909090909, "predicted_length": 13, "ground_truth_length": 22 }, { "character_accuracy": 0.6545454545454545, "edit_distance": 19, "normalized_edit_distance": 0.34545454545454546, "word_accuracy": 0.5454545454545454, "length_ratio": 0.8545454545454545, "predicted_length": 47, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.26666666666666666, "edit_distance": 11, "normalized_edit_distance": 0.7333333333333333, "word_accuracy": 0.0, "length_ratio": 0.5333333333333333, "predicted_length": 8, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.38181818181818183, "edit_distance": 34, "normalized_edit_distance": 0.6181818181818182, "word_accuracy": 0.0, "length_ratio": 0.7090909090909091, "predicted_length": 39, "ground_truth_length": 55 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.20833333333333334, "edit_distance": 152, "normalized_edit_distance": 0.7916666666666666, "word_accuracy": 0.0, "length_ratio": 1.7142857142857142, "predicted_length": 192, "ground_truth_length": 112 }, { "character_accuracy": 0.4166666666666667, "edit_distance": 28, "normalized_edit_distance": 0.5833333333333334, "word_accuracy": 0.2222222222222222, "length_ratio": 0.625, "predicted_length": 30, "ground_truth_length": 48 }, { "character_accuracy": 0.25, "edit_distance": 12, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.7333333333333333, "edit_distance": 12, "normalized_edit_distance": 0.26666666666666666, "word_accuracy": 0.36363636363636365, "length_ratio": 0.9111111111111111, "predicted_length": 41, "ground_truth_length": 45 }, { "character_accuracy": 0.9, "edit_distance": 5, "normalized_edit_distance": 0.1, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 6, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.22424242424242424, "edit_distance": 128, "normalized_edit_distance": 0.7757575757575758, "word_accuracy": 0.03125, "length_ratio": 1.8131868131868132, "predicted_length": 165, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.4117647058823529, "predicted_length": 7, "ground_truth_length": 17 }, { "character_accuracy": 0.15, "edit_distance": 34, "normalized_edit_distance": 0.85, "word_accuracy": 0.0, "length_ratio": 0.425, "predicted_length": 17, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 3, "ground_truth_length": 3 }, { "character_accuracy": 0.417910447761194, "edit_distance": 78, "normalized_edit_distance": 0.582089552238806, "word_accuracy": 0.16666666666666666, "length_ratio": 1.2884615384615385, "predicted_length": 134, "ground_truth_length": 104 }, { "character_accuracy": 0.1782178217821782, "edit_distance": 83, "normalized_edit_distance": 0.8217821782178217, "word_accuracy": 0.0, "length_ratio": 1.0520833333333333, "predicted_length": 101, "ground_truth_length": 96 }, { "character_accuracy": 0.8809523809523809, "edit_distance": 5, "normalized_edit_distance": 0.11904761904761904, "word_accuracy": 0.7, "length_ratio": 0.9761904761904762, "predicted_length": 41, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.7142857142857143, "edit_distance": 8, "normalized_edit_distance": 0.2857142857142857, "word_accuracy": 0.14285714285714285, "length_ratio": 1.0769230769230769, "predicted_length": 28, "ground_truth_length": 26 }, { "character_accuracy": 0.0625, "edit_distance": 15, "normalized_edit_distance": 0.9375, "word_accuracy": 0.0, "length_ratio": 0.375, "predicted_length": 6, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.6440677966101694, "edit_distance": 21, "normalized_edit_distance": 0.3559322033898305, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6949152542372882, "predicted_length": 41, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 22, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.2222222222222222, "length_ratio": 0.7878787878787878, "predicted_length": 26, "ground_truth_length": 33 }, { "character_accuracy": 0.11320754716981132, "edit_distance": 47, "normalized_edit_distance": 0.8867924528301887, "word_accuracy": 0.0, "length_ratio": 0.3584905660377358, "predicted_length": 19, "ground_truth_length": 53 }, { "character_accuracy": 0.7868852459016393, "edit_distance": 13, "normalized_edit_distance": 0.21311475409836064, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 1000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:25:18.508488", "loss": 0.8644448637962341, "perplexity": 2.373687982559204, "min_loss": 0.4200422167778015, "max_loss": 1.4333516359329224, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.38742342612535147, "avg_word_accuracy": 0.19101810389729262, "avg_edit_distance": 24.04040404040404, "avg_normalized_edit_distance": 0.6125765738746487, "avg_length_ratio": 0.7450831340507312, "text_samples_evaluated": 99, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.3018867924528302, "edit_distance": 37, "normalized_edit_distance": 0.6981132075471698, "word_accuracy": 0.0, "length_ratio": 0.5283018867924528, "predicted_length": 28, "ground_truth_length": 53 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.8953488372093024, "edit_distance": 9, "normalized_edit_distance": 0.10465116279069768, "word_accuracy": 0.8571428571428571, "length_ratio": 0.9069767441860465, "predicted_length": 78, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.509090909090909, "edit_distance": 27, "normalized_edit_distance": 0.4909090909090909, "word_accuracy": 0.0, "length_ratio": 0.7454545454545455, "predicted_length": 41, "ground_truth_length": 55 }, { "character_accuracy": 0.5714285714285714, "edit_distance": 3, "normalized_edit_distance": 0.42857142857142855, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 7, "ground_truth_length": 7 }, { "character_accuracy": 0.5, "edit_distance": 21, "normalized_edit_distance": 0.5, "word_accuracy": 0.0, "length_ratio": 0.7380952380952381, "predicted_length": 31, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.30434782608695654, "edit_distance": 16, "normalized_edit_distance": 0.6956521739130435, "word_accuracy": 0.0, "length_ratio": 1.2105263157894737, "predicted_length": 23, "ground_truth_length": 19 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.6862745098039216, "edit_distance": 16, "normalized_edit_distance": 0.3137254901960784, "word_accuracy": 0.5, "length_ratio": 0.803921568627451, "predicted_length": 41, "ground_truth_length": 51 }, { "character_accuracy": 0.20454545454545456, "edit_distance": 35, "normalized_edit_distance": 0.7954545454545454, "word_accuracy": 0.0, "length_ratio": 0.45454545454545453, "predicted_length": 20, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.3, "edit_distance": 7, "normalized_edit_distance": 0.7, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.2916666666666667, "edit_distance": 34, "normalized_edit_distance": 0.7083333333333334, "word_accuracy": 0.09090909090909091, "length_ratio": 0.4583333333333333, "predicted_length": 22, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.3783783783783784, "edit_distance": 23, "normalized_edit_distance": 0.6216216216216216, "word_accuracy": 0.25, "length_ratio": 0.7567567567567568, "predicted_length": 28, "ground_truth_length": 37 }, { "character_accuracy": 0.6896551724137931, "edit_distance": 18, "normalized_edit_distance": 0.3103448275862069, "word_accuracy": 0.16666666666666666, "length_ratio": 0.8448275862068966, "predicted_length": 49, "ground_truth_length": 58 }, { "character_accuracy": 0.6136363636363636, "edit_distance": 17, "normalized_edit_distance": 0.38636363636363635, "word_accuracy": 0.1, "length_ratio": 0.7727272727272727, "predicted_length": 34, "ground_truth_length": 44 }, { "character_accuracy": 0.21212121212121213, "edit_distance": 26, "normalized_edit_distance": 0.7878787878787878, "word_accuracy": 0.0, "length_ratio": 0.5151515151515151, "predicted_length": 17, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.2, "length_ratio": 0.8958333333333334, "predicted_length": 43, "ground_truth_length": 48 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.5714285714285714, "length_ratio": 0.8205128205128205, "predicted_length": 32, "ground_truth_length": 39 }, { "character_accuracy": 0.11904761904761904, "edit_distance": 37, "normalized_edit_distance": 0.8809523809523809, "word_accuracy": 0.0, "length_ratio": 0.38095238095238093, "predicted_length": 16, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.3979591836734694, "edit_distance": 59, "normalized_edit_distance": 0.6020408163265306, "word_accuracy": 0.21739130434782608, "length_ratio": 1.1395348837209303, "predicted_length": 98, "ground_truth_length": 86 }, { "character_accuracy": 0.3473684210526316, "edit_distance": 62, "normalized_edit_distance": 0.6526315789473685, "word_accuracy": 0.4117647058823529, "length_ratio": 0.9263157894736842, "predicted_length": 88, "ground_truth_length": 95 }, { "character_accuracy": 0.48717948717948717, "edit_distance": 20, "normalized_edit_distance": 0.5128205128205128, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.21428571428571427, "edit_distance": 11, "normalized_edit_distance": 0.7857142857142857, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 6, "ground_truth_length": 14 }, { "character_accuracy": 0.25, "edit_distance": 30, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 1.25, "predicted_length": 40, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.8775510204081632, "edit_distance": 6, "normalized_edit_distance": 0.12244897959183673, "word_accuracy": 0.5, "length_ratio": 0.9387755102040817, "predicted_length": 46, "ground_truth_length": 49 }, { "character_accuracy": 0.9157894736842105, "edit_distance": 8, "normalized_edit_distance": 0.08421052631578947, "word_accuracy": 0.7857142857142857, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.25510204081632654, "edit_distance": 73, "normalized_edit_distance": 0.7448979591836735, "word_accuracy": 0.0, "length_ratio": 0.8061224489795918, "predicted_length": 79, "ground_truth_length": 98 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.2, "edit_distance": 16, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 10, "ground_truth_length": 20 }, { "character_accuracy": 0.1891891891891892, "edit_distance": 30, "normalized_edit_distance": 0.8108108108108109, "word_accuracy": 0.07692307692307693, "length_ratio": 1.6818181818181819, "predicted_length": 37, "ground_truth_length": 22 }, { "character_accuracy": 0.08333333333333333, "edit_distance": 33, "normalized_edit_distance": 0.9166666666666666, "word_accuracy": 0.0, "length_ratio": 0.2222222222222222, "predicted_length": 8, "ground_truth_length": 36 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5555555555555556, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.9375, "edit_distance": 4, "normalized_edit_distance": 0.0625, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 64, "ground_truth_length": 64 }, { "character_accuracy": 0.29906542056074764, "edit_distance": 75, "normalized_edit_distance": 0.7009345794392523, "word_accuracy": 0.041666666666666664, "length_ratio": 1.1263157894736842, "predicted_length": 107, "ground_truth_length": 95 }, { "character_accuracy": 0.16216216216216217, "edit_distance": 31, "normalized_edit_distance": 0.8378378378378378, "word_accuracy": 0.0, "length_ratio": 0.5405405405405406, "predicted_length": 20, "ground_truth_length": 37 }, { "character_accuracy": 0.29310344827586204, "edit_distance": 41, "normalized_edit_distance": 0.7068965517241379, "word_accuracy": 0.0, "length_ratio": 0.6551724137931034, "predicted_length": 38, "ground_truth_length": 58 }, { "character_accuracy": 0.5681818181818182, "edit_distance": 19, "normalized_edit_distance": 0.4318181818181818, "word_accuracy": 0.0, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 12, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.2222222222222222, "length_ratio": 0.9117647058823529, "predicted_length": 31, "ground_truth_length": 34 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 40, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.0, "length_ratio": 0.5166666666666667, "predicted_length": 31, "ground_truth_length": 60 }, { "character_accuracy": 0.8333333333333334, "edit_distance": 9, "normalized_edit_distance": 0.16666666666666666, "word_accuracy": 0.46153846153846156, "length_ratio": 0.9259259259259259, "predicted_length": 50, "ground_truth_length": 54 }, { "character_accuracy": 1.0, "edit_distance": 0, "normalized_edit_distance": 0.0, "word_accuracy": 1.0, "length_ratio": 1.0, "predicted_length": 5, "ground_truth_length": 5 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 5, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 3, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 160, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 2.216494845360825, "predicted_length": 215, "ground_truth_length": 97 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 9, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.6363636363636364, "predicted_length": 7, "ground_truth_length": 11 }, { "character_accuracy": 0.2283464566929134, "edit_distance": 98, "normalized_edit_distance": 0.7716535433070866, "word_accuracy": 0.2413793103448276, "length_ratio": 1.309278350515464, "predicted_length": 127, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 20, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 7, "ground_truth_length": 22 }, { "character_accuracy": 0.2711864406779661, "edit_distance": 43, "normalized_edit_distance": 0.7288135593220338, "word_accuracy": 0.0, "length_ratio": 1.0727272727272728, "predicted_length": 59, "ground_truth_length": 55 }, { "character_accuracy": 0.125, "edit_distance": 7, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.375, "predicted_length": 3, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.4, "edit_distance": 9, "normalized_edit_distance": 0.6, "word_accuracy": 0.25, "length_ratio": 0.7333333333333333, "predicted_length": 11, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.7272727272727273, "edit_distance": 15, "normalized_edit_distance": 0.2727272727272727, "word_accuracy": 0.5, "length_ratio": 0.9272727272727272, "predicted_length": 51, "ground_truth_length": 55 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 100, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 1.0714285714285714, "predicted_length": 120, "ground_truth_length": 112 }, { "character_accuracy": 0.4166666666666667, "edit_distance": 28, "normalized_edit_distance": 0.5833333333333334, "word_accuracy": 0.1, "length_ratio": 0.9375, "predicted_length": 45, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.8, "edit_distance": 9, "normalized_edit_distance": 0.2, "word_accuracy": 0.6, "length_ratio": 0.9555555555555556, "predicted_length": 43, "ground_truth_length": 45 }, { "character_accuracy": 0.0, "edit_distance": 50, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16, "predicted_length": 8, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.3, "edit_distance": 91, "normalized_edit_distance": 0.7, "word_accuracy": 0.2, "length_ratio": 1.4285714285714286, "predicted_length": 130, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.4117647058823529, "predicted_length": 7, "ground_truth_length": 17 }, { "character_accuracy": 0.125, "edit_distance": 35, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 16, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.2315270935960591, "edit_distance": 156, "normalized_edit_distance": 0.7684729064039408, "word_accuracy": 0.0, "length_ratio": 1.9519230769230769, "predicted_length": 203, "ground_truth_length": 104 }, { "character_accuracy": 0.23668639053254437, "edit_distance": 129, "normalized_edit_distance": 0.7633136094674556, "word_accuracy": 0.0, "length_ratio": 1.7604166666666667, "predicted_length": 169, "ground_truth_length": 96 }, { "character_accuracy": 1.0, "edit_distance": 0, "normalized_edit_distance": 0.0, "word_accuracy": 1.0, "length_ratio": 1.0, "predicted_length": 42, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.34615384615384615, "edit_distance": 17, "normalized_edit_distance": 0.6538461538461539, "word_accuracy": 0.16666666666666666, "length_ratio": 0.7307692307692307, "predicted_length": 19, "ground_truth_length": 26 }, { "character_accuracy": 0.0625, "edit_distance": 15, "normalized_edit_distance": 0.9375, "word_accuracy": 0.0, "length_ratio": 0.375, "predicted_length": 6, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.4576271186440678, "edit_distance": 32, "normalized_edit_distance": 0.5423728813559322, "word_accuracy": 0.25, "length_ratio": 0.6440677966101694, "predicted_length": 38, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.7575757575757576, "predicted_length": 25, "ground_truth_length": 33 }, { "character_accuracy": 0.24528301886792453, "edit_distance": 40, "normalized_edit_distance": 0.7547169811320755, "word_accuracy": 0.18181818181818182, "length_ratio": 0.6415094339622641, "predicted_length": 34, "ground_truth_length": 53 }, { "character_accuracy": 0.7868852459016393, "edit_distance": 13, "normalized_edit_distance": 0.21311475409836064, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 1500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:26:29.665421", "loss": 0.8401906085014343, "perplexity": 2.3168084621429443, "min_loss": 0.40070778131484985, "max_loss": 1.435326337814331, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.38384316369419, "avg_word_accuracy": 0.1888865697104828, "avg_edit_distance": 23.43, "avg_normalized_edit_distance": 0.6161568363058101, "avg_length_ratio": 0.761705968699557, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.8, "edit_distance": 2, "normalized_edit_distance": 0.2, "word_accuracy": 0.3333333333333333, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.23636363636363636, "edit_distance": 42, "normalized_edit_distance": 0.7636363636363637, "word_accuracy": 0.0, "length_ratio": 1.0377358490566038, "predicted_length": 55, "ground_truth_length": 53 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.46511627906976744, "edit_distance": 46, "normalized_edit_distance": 0.5348837209302325, "word_accuracy": 0.5714285714285714, "length_ratio": 0.813953488372093, "predicted_length": 70, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.3090909090909091, "edit_distance": 38, "normalized_edit_distance": 0.6909090909090909, "word_accuracy": 0.0, "length_ratio": 0.4727272727272727, "predicted_length": 26, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.5, "edit_distance": 21, "normalized_edit_distance": 0.5, "word_accuracy": 0.0, "length_ratio": 0.7380952380952381, "predicted_length": 31, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.3684210526315789, "edit_distance": 12, "normalized_edit_distance": 0.631578947368421, "word_accuracy": 0.0, "length_ratio": 0.8947368421052632, "predicted_length": 17, "ground_truth_length": 19 }, { "character_accuracy": 0.5555555555555556, "edit_distance": 8, "normalized_edit_distance": 0.4444444444444444, "word_accuracy": 0.2, "length_ratio": 1.0588235294117647, "predicted_length": 18, "ground_truth_length": 17 }, { "character_accuracy": 0.7435897435897436, "edit_distance": 10, "normalized_edit_distance": 0.2564102564102564, "word_accuracy": 0.4444444444444444, "length_ratio": 0.8461538461538461, "predicted_length": 33, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.6862745098039216, "edit_distance": 16, "normalized_edit_distance": 0.3137254901960784, "word_accuracy": 0.5, "length_ratio": 0.803921568627451, "predicted_length": 41, "ground_truth_length": 51 }, { "character_accuracy": 0.20454545454545456, "edit_distance": 35, "normalized_edit_distance": 0.7954545454545454, "word_accuracy": 0.0, "length_ratio": 0.45454545454545453, "predicted_length": 20, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.3541666666666667, "edit_distance": 31, "normalized_edit_distance": 0.6458333333333334, "word_accuracy": 0.4, "length_ratio": 0.5625, "predicted_length": 27, "ground_truth_length": 48 }, { "character_accuracy": 0.8301886792452831, "edit_distance": 9, "normalized_edit_distance": 0.16981132075471697, "word_accuracy": 0.7272727272727273, "length_ratio": 0.9433962264150944, "predicted_length": 50, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 40, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 1.3513513513513513, "predicted_length": 50, "ground_truth_length": 37 }, { "character_accuracy": 0.3793103448275862, "edit_distance": 36, "normalized_edit_distance": 0.6206896551724138, "word_accuracy": 0.0, "length_ratio": 0.7413793103448276, "predicted_length": 43, "ground_truth_length": 58 }, { "character_accuracy": 0.022727272727272728, "edit_distance": 43, "normalized_edit_distance": 0.9772727272727273, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 10, "ground_truth_length": 44 }, { "character_accuracy": 0.7575757575757576, "edit_distance": 8, "normalized_edit_distance": 0.24242424242424243, "word_accuracy": 0.1111111111111111, "length_ratio": 0.8484848484848485, "predicted_length": 28, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.8125, "edit_distance": 9, "normalized_edit_distance": 0.1875, "word_accuracy": 0.375, "length_ratio": 0.8958333333333334, "predicted_length": 43, "ground_truth_length": 48 }, { "character_accuracy": 0.6410256410256411, "edit_distance": 14, "normalized_edit_distance": 0.358974358974359, "word_accuracy": 0.3333333333333333, "length_ratio": 0.9230769230769231, "predicted_length": 36, "ground_truth_length": 39 }, { "character_accuracy": 0.23809523809523808, "edit_distance": 32, "normalized_edit_distance": 0.7619047619047619, "word_accuracy": 0.0, "length_ratio": 0.6666666666666666, "predicted_length": 28, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.21301775147928995, "edit_distance": 133, "normalized_edit_distance": 0.7869822485207101, "word_accuracy": 0.0, "length_ratio": 1.9651162790697674, "predicted_length": 169, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 21, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.07142857142857142, "edit_distance": 13, "normalized_edit_distance": 0.9285714285714286, "word_accuracy": 0.0, "length_ratio": 0.35714285714285715, "predicted_length": 5, "ground_truth_length": 14 }, { "character_accuracy": 0.2549019607843137, "edit_distance": 38, "normalized_edit_distance": 0.7450980392156863, "word_accuracy": 0.0, "length_ratio": 1.59375, "predicted_length": 51, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.9387755102040817, "edit_distance": 3, "normalized_edit_distance": 0.061224489795918366, "word_accuracy": 0.6, "length_ratio": 1.0, "predicted_length": 49, "ground_truth_length": 49 }, { "character_accuracy": 0.9157894736842105, "edit_distance": 8, "normalized_edit_distance": 0.08421052631578947, "word_accuracy": 0.7857142857142857, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.22549019607843138, "edit_distance": 79, "normalized_edit_distance": 0.7745098039215687, "word_accuracy": 0.0, "length_ratio": 1.0408163265306123, "predicted_length": 102, "ground_truth_length": 98 }, { "character_accuracy": 0.2, "edit_distance": 8, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1, "edit_distance": 18, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.3, "predicted_length": 6, "ground_truth_length": 20 }, { "character_accuracy": 0.2, "edit_distance": 32, "normalized_edit_distance": 0.8, "word_accuracy": 0.07692307692307693, "length_ratio": 1.8181818181818181, "predicted_length": 40, "ground_truth_length": 22 }, { "character_accuracy": 0.08333333333333333, "edit_distance": 33, "normalized_edit_distance": 0.9166666666666666, "word_accuracy": 0.0, "length_ratio": 0.2222222222222222, "predicted_length": 8, "ground_truth_length": 36 }, { "character_accuracy": 0.7727272727272727, "edit_distance": 10, "normalized_edit_distance": 0.22727272727272727, "word_accuracy": 0.2727272727272727, "length_ratio": 1.0, "predicted_length": 44, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.890625, "edit_distance": 7, "normalized_edit_distance": 0.109375, "word_accuracy": 0.5, "length_ratio": 0.984375, "predicted_length": 63, "ground_truth_length": 64 }, { "character_accuracy": 0.2761904761904762, "edit_distance": 76, "normalized_edit_distance": 0.7238095238095238, "word_accuracy": 0.0, "length_ratio": 1.105263157894737, "predicted_length": 105, "ground_truth_length": 95 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.125, "length_ratio": 0.6216216216216216, "predicted_length": 23, "ground_truth_length": 37 }, { "character_accuracy": 0.5862068965517241, "edit_distance": 24, "normalized_edit_distance": 0.41379310344827586, "word_accuracy": 0.0, "length_ratio": 0.896551724137931, "predicted_length": 52, "ground_truth_length": 58 }, { "character_accuracy": 0.5454545454545454, "edit_distance": 20, "normalized_edit_distance": 0.45454545454545453, "word_accuracy": 0.15384615384615385, "length_ratio": 0.8863636363636364, "predicted_length": 39, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.78, "edit_distance": 11, "normalized_edit_distance": 0.22, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 12, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.375, "length_ratio": 0.8529411764705882, "predicted_length": 29, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8518518518518519, "edit_distance": 8, "normalized_edit_distance": 0.14814814814814814, "word_accuracy": 0.5833333333333334, "length_ratio": 0.9444444444444444, "predicted_length": 51, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.2, "edit_distance": 16, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.65, "predicted_length": 13, "ground_truth_length": 20 }, { "character_accuracy": 0.2570093457943925, "edit_distance": 159, "normalized_edit_distance": 0.7429906542056075, "word_accuracy": 0.0, "length_ratio": 2.2061855670103094, "predicted_length": 214, "ground_truth_length": 97 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 10, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 6, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 19, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 11, "ground_truth_length": 22 }, { "character_accuracy": 0.2542372881355932, "edit_distance": 44, "normalized_edit_distance": 0.7457627118644068, "word_accuracy": 0.0, "length_ratio": 1.0727272727272728, "predicted_length": 59, "ground_truth_length": 55 }, { "character_accuracy": 0.25, "edit_distance": 6, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.625, "predicted_length": 5, "ground_truth_length": 8 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 7, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.4666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.5333333333333333, "word_accuracy": 0.25, "length_ratio": 0.8, "predicted_length": 12, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6363636363636364, "edit_distance": 20, "normalized_edit_distance": 0.36363636363636365, "word_accuracy": 0.08333333333333333, "length_ratio": 0.7272727272727273, "predicted_length": 40, "ground_truth_length": 55 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.625, "edit_distance": 42, "normalized_edit_distance": 0.375, "word_accuracy": 0.5454545454545454, "length_ratio": 0.6607142857142857, "predicted_length": 74, "ground_truth_length": 112 }, { "character_accuracy": 0.4791666666666667, "edit_distance": 25, "normalized_edit_distance": 0.5208333333333334, "word_accuracy": 0.125, "length_ratio": 0.7916666666666666, "predicted_length": 38, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.8444444444444444, "edit_distance": 7, "normalized_edit_distance": 0.15555555555555556, "word_accuracy": 0.5, "length_ratio": 0.9111111111111111, "predicted_length": 41, "ground_truth_length": 45 }, { "character_accuracy": 0.72, "edit_distance": 14, "normalized_edit_distance": 0.28, "word_accuracy": 0.5555555555555556, "length_ratio": 0.82, "predicted_length": 41, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.23529411764705882, "edit_distance": 104, "normalized_edit_distance": 0.7647058823529411, "word_accuracy": 0.043478260869565216, "length_ratio": 1.4945054945054945, "predicted_length": 136, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.4117647058823529, "predicted_length": 7, "ground_truth_length": 17 }, { "character_accuracy": 0.2, "edit_distance": 32, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.525, "predicted_length": 21, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.23170731707317074, "edit_distance": 126, "normalized_edit_distance": 0.7682926829268293, "word_accuracy": 0.0, "length_ratio": 1.5769230769230769, "predicted_length": 164, "ground_truth_length": 104 }, { "character_accuracy": 0.2154696132596685, "edit_distance": 142, "normalized_edit_distance": 0.7845303867403315, "word_accuracy": 0.0, "length_ratio": 1.8854166666666667, "predicted_length": 181, "ground_truth_length": 96 }, { "character_accuracy": 0.35714285714285715, "edit_distance": 27, "normalized_edit_distance": 0.6428571428571429, "word_accuracy": 0.16666666666666666, "length_ratio": 0.7142857142857143, "predicted_length": 30, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 14, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.14285714285714285, "length_ratio": 0.8461538461538461, "predicted_length": 22, "ground_truth_length": 26 }, { "character_accuracy": 0.375, "edit_distance": 10, "normalized_edit_distance": 0.625, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.5932203389830508, "edit_distance": 24, "normalized_edit_distance": 0.4067796610169492, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6779661016949152, "predicted_length": 40, "ground_truth_length": 59 }, { "character_accuracy": 0.2, "edit_distance": 8, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.7, "predicted_length": 7, "ground_truth_length": 10 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 24, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.24528301886792453, "edit_distance": 40, "normalized_edit_distance": 0.7547169811320755, "word_accuracy": 0.18181818181818182, "length_ratio": 0.6415094339622641, "predicted_length": 34, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 2000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:27:40.643252", "loss": 0.813947338461876, "perplexity": 2.25679874420166, "min_loss": 0.40211907029151917, "max_loss": 1.342209815979004, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.37927251786728255, "avg_word_accuracy": 0.1984805951634899, "avg_edit_distance": 21.5, "avg_normalized_edit_distance": 0.6207274821327177, "avg_length_ratio": 0.6796414640674899, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.8, "edit_distance": 2, "normalized_edit_distance": 0.2, "word_accuracy": 0.3333333333333333, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.6415094339622641, "edit_distance": 19, "normalized_edit_distance": 0.3584905660377358, "word_accuracy": 0.4, "length_ratio": 0.7735849056603774, "predicted_length": 41, "ground_truth_length": 53 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.5697674418604651, "edit_distance": 37, "normalized_edit_distance": 0.43023255813953487, "word_accuracy": 0.6, "length_ratio": 0.7906976744186046, "predicted_length": 68, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.45454545454545453, "edit_distance": 30, "normalized_edit_distance": 0.5454545454545454, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 40, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.6666666666666666, "predicted_length": 28, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.47368421052631576, "edit_distance": 10, "normalized_edit_distance": 0.5263157894736842, "word_accuracy": 0.0, "length_ratio": 0.6842105263157895, "predicted_length": 13, "ground_truth_length": 19 }, { "character_accuracy": 0.058823529411764705, "edit_distance": 16, "normalized_edit_distance": 0.9411764705882353, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.6862745098039216, "edit_distance": 16, "normalized_edit_distance": 0.3137254901960784, "word_accuracy": 0.5, "length_ratio": 0.803921568627451, "predicted_length": 41, "ground_truth_length": 51 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.2727272727272727, "predicted_length": 12, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.7636363636363637, "edit_distance": 13, "normalized_edit_distance": 0.23636363636363636, "word_accuracy": 0.3, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.3541666666666667, "edit_distance": 31, "normalized_edit_distance": 0.6458333333333334, "word_accuracy": 0.4, "length_ratio": 0.5625, "predicted_length": 27, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.43243243243243246, "edit_distance": 21, "normalized_edit_distance": 0.5675675675675675, "word_accuracy": 0.25, "length_ratio": 0.7837837837837838, "predicted_length": 29, "ground_truth_length": 37 }, { "character_accuracy": 0.3620689655172414, "edit_distance": 37, "normalized_edit_distance": 0.6379310344827587, "word_accuracy": 0.0, "length_ratio": 0.7758620689655172, "predicted_length": 45, "ground_truth_length": 58 }, { "character_accuracy": 0.022727272727272728, "edit_distance": 43, "normalized_edit_distance": 0.9772727272727273, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 10, "ground_truth_length": 44 }, { "character_accuracy": 0.15151515151515152, "edit_distance": 28, "normalized_edit_distance": 0.8484848484848485, "word_accuracy": 0.0, "length_ratio": 0.48484848484848486, "predicted_length": 16, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.2, "length_ratio": 0.8958333333333334, "predicted_length": 43, "ground_truth_length": 48 }, { "character_accuracy": 0.5897435897435898, "edit_distance": 16, "normalized_edit_distance": 0.41025641025641024, "word_accuracy": 0.375, "length_ratio": 0.7948717948717948, "predicted_length": 31, "ground_truth_length": 39 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 35, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.6190476190476191, "predicted_length": 26, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8850574712643678, "edit_distance": 10, "normalized_edit_distance": 0.11494252873563218, "word_accuracy": 0.6428571428571429, "length_ratio": 1.0116279069767442, "predicted_length": 87, "ground_truth_length": 86 }, { "character_accuracy": 0.19298245614035087, "edit_distance": 92, "normalized_edit_distance": 0.8070175438596491, "word_accuracy": 0.03333333333333333, "length_ratio": 1.2, "predicted_length": 114, "ground_truth_length": 95 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 21, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.07142857142857142, "edit_distance": 13, "normalized_edit_distance": 0.9285714285714286, "word_accuracy": 0.0, "length_ratio": 0.35714285714285715, "predicted_length": 5, "ground_truth_length": 14 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 27, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 1.03125, "predicted_length": 33, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 28, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.3, "length_ratio": 0.7551020408163265, "predicted_length": 37, "ground_truth_length": 49 }, { "character_accuracy": 0.9157894736842105, "edit_distance": 8, "normalized_edit_distance": 0.08421052631578947, "word_accuracy": 0.7857142857142857, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.19387755102040816, "edit_distance": 79, "normalized_edit_distance": 0.8061224489795918, "word_accuracy": 0.0, "length_ratio": 0.5816326530612245, "predicted_length": 57, "ground_truth_length": 98 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.1891891891891892, "edit_distance": 30, "normalized_edit_distance": 0.8108108108108109, "word_accuracy": 0.07692307692307693, "length_ratio": 1.6818181818181819, "predicted_length": 37, "ground_truth_length": 22 }, { "character_accuracy": 0.08333333333333333, "edit_distance": 33, "normalized_edit_distance": 0.9166666666666666, "word_accuracy": 0.0, "length_ratio": 0.2222222222222222, "predicted_length": 8, "ground_truth_length": 36 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.2692307692307692, "edit_distance": 76, "normalized_edit_distance": 0.7307692307692307, "word_accuracy": 0.0, "length_ratio": 1.0947368421052632, "predicted_length": 104, "ground_truth_length": 95 }, { "character_accuracy": 0.6216216216216216, "edit_distance": 14, "normalized_edit_distance": 0.3783783783783784, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8918918918918919, "predicted_length": 33, "ground_truth_length": 37 }, { "character_accuracy": 0.4482758620689655, "edit_distance": 32, "normalized_edit_distance": 0.5517241379310345, "word_accuracy": 0.09090909090909091, "length_ratio": 0.6896551724137931, "predicted_length": 40, "ground_truth_length": 58 }, { "character_accuracy": 0.4090909090909091, "edit_distance": 26, "normalized_edit_distance": 0.5909090909090909, "word_accuracy": 0.0, "length_ratio": 0.7045454545454546, "predicted_length": 31, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.08823529411764706, "edit_distance": 31, "normalized_edit_distance": 0.9117647058823529, "word_accuracy": 0.0, "length_ratio": 0.4117647058823529, "predicted_length": 14, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8333333333333334, "edit_distance": 9, "normalized_edit_distance": 0.16666666666666666, "word_accuracy": 0.46153846153846156, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.2570093457943925, "edit_distance": 159, "normalized_edit_distance": 0.7429906542056075, "word_accuracy": 0.0, "length_ratio": 2.2061855670103094, "predicted_length": 214, "ground_truth_length": 97 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 10, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.6363636363636364, "predicted_length": 7, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.5454545454545454, "edit_distance": 10, "normalized_edit_distance": 0.45454545454545453, "word_accuracy": 0.3333333333333333, "length_ratio": 0.9545454545454546, "predicted_length": 21, "ground_truth_length": 22 }, { "character_accuracy": 0.23333333333333334, "edit_distance": 46, "normalized_edit_distance": 0.7666666666666667, "word_accuracy": 0.0, "length_ratio": 1.0909090909090908, "predicted_length": 60, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 10, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.0, "length_ratio": 0.5333333333333333, "predicted_length": 8, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.32727272727272727, "edit_distance": 37, "normalized_edit_distance": 0.6727272727272727, "word_accuracy": 0.0, "length_ratio": 0.509090909090909, "predicted_length": 28, "ground_truth_length": 55 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.19642857142857142, "edit_distance": 90, "normalized_edit_distance": 0.8035714285714286, "word_accuracy": 0.0, "length_ratio": 0.8660714285714286, "predicted_length": 97, "ground_truth_length": 112 }, { "character_accuracy": 0.625, "edit_distance": 18, "normalized_edit_distance": 0.375, "word_accuracy": 0.3, "length_ratio": 0.7708333333333334, "predicted_length": 37, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.7555555555555555, "edit_distance": 11, "normalized_edit_distance": 0.24444444444444444, "word_accuracy": 0.4166666666666667, "length_ratio": 1.0, "predicted_length": 45, "ground_truth_length": 45 }, { "character_accuracy": 0.3, "edit_distance": 35, "normalized_edit_distance": 0.7, "word_accuracy": 0.2222222222222222, "length_ratio": 0.52, "predicted_length": 26, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.23404255319148937, "edit_distance": 72, "normalized_edit_distance": 0.7659574468085106, "word_accuracy": 0.0625, "length_ratio": 1.032967032967033, "predicted_length": 94, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.4117647058823529, "predicted_length": 7, "ground_truth_length": 17 }, { "character_accuracy": 0.225, "edit_distance": 31, "normalized_edit_distance": 0.775, "word_accuracy": 0.0, "length_ratio": 0.425, "predicted_length": 17, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.23404255319148937, "edit_distance": 108, "normalized_edit_distance": 0.7659574468085106, "word_accuracy": 0.10810810810810811, "length_ratio": 1.3557692307692308, "predicted_length": 141, "ground_truth_length": 104 }, { "character_accuracy": 0.84375, "edit_distance": 15, "normalized_edit_distance": 0.15625, "word_accuracy": 0.631578947368421, "length_ratio": 0.90625, "predicted_length": 87, "ground_truth_length": 96 }, { "character_accuracy": 0.7380952380952381, "edit_distance": 11, "normalized_edit_distance": 0.2619047619047619, "word_accuracy": 0.7777777777777778, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.6538461538461539, "edit_distance": 9, "normalized_edit_distance": 0.34615384615384615, "word_accuracy": 0.3333333333333333, "length_ratio": 0.7692307692307693, "predicted_length": 20, "ground_truth_length": 26 }, { "character_accuracy": 0.375, "edit_distance": 10, "normalized_edit_distance": 0.625, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8813559322033898, "edit_distance": 7, "normalized_edit_distance": 0.11864406779661017, "word_accuracy": 0.6363636363636364, "length_ratio": 0.9661016949152542, "predicted_length": 57, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 24, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.7924528301886793, "edit_distance": 11, "normalized_edit_distance": 0.20754716981132076, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9245283018867925, "predicted_length": 49, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 2500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:28:51.951135", "loss": 0.7890318787097931, "perplexity": 2.2012643814086914, "min_loss": 0.35444435477256775, "max_loss": 1.3153470754623413, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.384571464565812, "avg_word_accuracy": 0.1893172105672106, "avg_edit_distance": 22.12, "avg_normalized_edit_distance": 0.6154285354341882, "avg_length_ratio": 0.731354611338375, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 5, "ground_truth_length": 10 }, { "character_accuracy": 0.37735849056603776, "edit_distance": 33, "normalized_edit_distance": 0.6226415094339622, "word_accuracy": 0.08333333333333333, "length_ratio": 0.6037735849056604, "predicted_length": 32, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.46511627906976744, "edit_distance": 46, "normalized_edit_distance": 0.5348837209302325, "word_accuracy": 0.5714285714285714, "length_ratio": 0.813953488372093, "predicted_length": 70, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.5636363636363636, "edit_distance": 24, "normalized_edit_distance": 0.43636363636363634, "word_accuracy": 0.0, "length_ratio": 0.7636363636363637, "predicted_length": 42, "ground_truth_length": 55 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 4, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.35714285714285715, "edit_distance": 27, "normalized_edit_distance": 0.6428571428571429, "word_accuracy": 0.0, "length_ratio": 0.8333333333333334, "predicted_length": 35, "ground_truth_length": 42 }, { "character_accuracy": 0.4, "edit_distance": 3, "normalized_edit_distance": 0.6, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.32, "edit_distance": 17, "normalized_edit_distance": 0.68, "word_accuracy": 0.0, "length_ratio": 1.3157894736842106, "predicted_length": 25, "ground_truth_length": 19 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.5294117647058824, "predicted_length": 9, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.9019607843137255, "edit_distance": 5, "normalized_edit_distance": 0.09803921568627451, "word_accuracy": 0.5, "length_ratio": 0.9803921568627451, "predicted_length": 50, "ground_truth_length": 51 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.3409090909090909, "predicted_length": 15, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.3541666666666667, "edit_distance": 31, "normalized_edit_distance": 0.6458333333333334, "word_accuracy": 0.4, "length_ratio": 0.5625, "predicted_length": 27, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.43243243243243246, "edit_distance": 21, "normalized_edit_distance": 0.5675675675675675, "word_accuracy": 0.25, "length_ratio": 0.7837837837837838, "predicted_length": 29, "ground_truth_length": 37 }, { "character_accuracy": 0.7758620689655172, "edit_distance": 13, "normalized_edit_distance": 0.22413793103448276, "word_accuracy": 0.3076923076923077, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.06818181818181818, "edit_distance": 41, "normalized_edit_distance": 0.9318181818181818, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 11, "ground_truth_length": 44 }, { "character_accuracy": 0.30303030303030304, "edit_distance": 23, "normalized_edit_distance": 0.696969696969697, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 18, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.2, "length_ratio": 0.8958333333333334, "predicted_length": 43, "ground_truth_length": 48 }, { "character_accuracy": 0.9487179487179487, "edit_distance": 2, "normalized_edit_distance": 0.05128205128205128, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9487179487179487, "predicted_length": 37, "ground_truth_length": 39 }, { "character_accuracy": 0.19047619047619047, "edit_distance": 34, "normalized_edit_distance": 0.8095238095238095, "word_accuracy": 0.0, "length_ratio": 0.6190476190476191, "predicted_length": 26, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8837209302325582, "edit_distance": 10, "normalized_edit_distance": 0.11627906976744186, "word_accuracy": 0.5714285714285714, "length_ratio": 0.9302325581395349, "predicted_length": 80, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 21, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.07142857142857142, "edit_distance": 13, "normalized_edit_distance": 0.9285714285714286, "word_accuracy": 0.0, "length_ratio": 0.35714285714285715, "predicted_length": 5, "ground_truth_length": 14 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 30, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.1875, "predicted_length": 38, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.3469387755102041, "edit_distance": 32, "normalized_edit_distance": 0.6530612244897959, "word_accuracy": 0.18181818181818182, "length_ratio": 0.673469387755102, "predicted_length": 33, "ground_truth_length": 49 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8461538461538461, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.22099447513812154, "edit_distance": 141, "normalized_edit_distance": 0.7790055248618785, "word_accuracy": 0.0, "length_ratio": 1.846938775510204, "predicted_length": 181, "ground_truth_length": 98 }, { "character_accuracy": 0.2, "edit_distance": 8, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1, "edit_distance": 18, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.3, "predicted_length": 6, "ground_truth_length": 20 }, { "character_accuracy": 0.18421052631578946, "edit_distance": 31, "normalized_edit_distance": 0.8157894736842105, "word_accuracy": 0.07692307692307693, "length_ratio": 1.7272727272727273, "predicted_length": 38, "ground_truth_length": 22 }, { "character_accuracy": 0.1388888888888889, "edit_distance": 31, "normalized_edit_distance": 0.8611111111111112, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 9, "ground_truth_length": 36 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.2692307692307692, "edit_distance": 76, "normalized_edit_distance": 0.7307692307692307, "word_accuracy": 0.0, "length_ratio": 1.0947368421052632, "predicted_length": 104, "ground_truth_length": 95 }, { "character_accuracy": 0.1891891891891892, "edit_distance": 30, "normalized_edit_distance": 0.8108108108108109, "word_accuracy": 0.0, "length_ratio": 0.4594594594594595, "predicted_length": 17, "ground_truth_length": 37 }, { "character_accuracy": 0.2413793103448276, "edit_distance": 44, "normalized_edit_distance": 0.7586206896551724, "word_accuracy": 0.07692307692307693, "length_ratio": 0.8620689655172413, "predicted_length": 50, "ground_truth_length": 58 }, { "character_accuracy": 0.5909090909090909, "edit_distance": 18, "normalized_edit_distance": 0.4090909090909091, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7272727272727273, "predicted_length": 32, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.375, "length_ratio": 0.8529411764705882, "predicted_length": 29, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.7777777777777778, "edit_distance": 12, "normalized_edit_distance": 0.2222222222222222, "word_accuracy": 0.5, "length_ratio": 0.9259259259259259, "predicted_length": 50, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.24378109452736318, "edit_distance": 152, "normalized_edit_distance": 0.7562189054726368, "word_accuracy": 0.0, "length_ratio": 2.0721649484536084, "predicted_length": 201, "ground_truth_length": 97 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 9, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.25, "edit_distance": 78, "normalized_edit_distance": 0.75, "word_accuracy": 0.3076923076923077, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 19, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 11, "ground_truth_length": 22 }, { "character_accuracy": 0.25, "edit_distance": 45, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 1.0909090909090908, "predicted_length": 60, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.0, "edit_distance": 15, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4666666666666667, "predicted_length": 7, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.5636363636363636, "edit_distance": 24, "normalized_edit_distance": 0.43636363636363634, "word_accuracy": 0.2, "length_ratio": 0.6909090909090909, "predicted_length": 38, "ground_truth_length": 55 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.24107142857142858, "edit_distance": 85, "normalized_edit_distance": 0.7589285714285714, "word_accuracy": 0.0, "length_ratio": 0.5357142857142857, "predicted_length": 60, "ground_truth_length": 112 }, { "character_accuracy": 0.6875, "edit_distance": 15, "normalized_edit_distance": 0.3125, "word_accuracy": 0.3, "length_ratio": 0.8125, "predicted_length": 39, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.717391304347826, "edit_distance": 13, "normalized_edit_distance": 0.2826086956521739, "word_accuracy": 0.4166666666666667, "length_ratio": 1.0222222222222221, "predicted_length": 46, "ground_truth_length": 45 }, { "character_accuracy": 0.92, "edit_distance": 4, "normalized_edit_distance": 0.08, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.23404255319148937, "edit_distance": 72, "normalized_edit_distance": 0.7659574468085106, "word_accuracy": 0.06666666666666667, "length_ratio": 1.032967032967033, "predicted_length": 94, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.29411764705882354, "predicted_length": 5, "ground_truth_length": 17 }, { "character_accuracy": 0.125, "edit_distance": 35, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 16, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.7884615384615384, "edit_distance": 22, "normalized_edit_distance": 0.21153846153846154, "word_accuracy": 0.5454545454545454, "length_ratio": 0.8846153846153846, "predicted_length": 92, "ground_truth_length": 104 }, { "character_accuracy": 0.21608040201005024, "edit_distance": 156, "normalized_edit_distance": 0.7839195979899497, "word_accuracy": 0.0, "length_ratio": 2.0729166666666665, "predicted_length": 199, "ground_truth_length": 96 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.2727272727272727, "length_ratio": 0.7142857142857143, "predicted_length": 30, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.5, "edit_distance": 13, "normalized_edit_distance": 0.5, "word_accuracy": 0.14285714285714285, "length_ratio": 0.8846153846153846, "predicted_length": 23, "ground_truth_length": 26 }, { "character_accuracy": 0.5625, "edit_distance": 7, "normalized_edit_distance": 0.4375, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 12, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.3898305084745763, "edit_distance": 36, "normalized_edit_distance": 0.6101694915254238, "word_accuracy": 0.16666666666666666, "length_ratio": 0.6271186440677966, "predicted_length": 37, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 24, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.4528301886792453, "edit_distance": 29, "normalized_edit_distance": 0.5471698113207547, "word_accuracy": 0.15384615384615385, "length_ratio": 0.7169811320754716, "predicted_length": 38, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 3000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:30:02.639985", "loss": 0.7793132990598679, "perplexity": 2.1799747943878174, "min_loss": 0.40687626600265503, "max_loss": 1.3542389869689941, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.3932117182912491, "avg_word_accuracy": 0.19454997632226737, "avg_edit_distance": 19.84, "avg_normalized_edit_distance": 0.6067882817087509, "avg_length_ratio": 0.7107252615615305, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.7169811320754716, "edit_distance": 15, "normalized_edit_distance": 0.2830188679245283, "word_accuracy": 0.25, "length_ratio": 0.8490566037735849, "predicted_length": 45, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.12790697674418605, "edit_distance": 75, "normalized_edit_distance": 0.872093023255814, "word_accuracy": 0.06666666666666667, "length_ratio": 0.6627906976744186, "predicted_length": 57, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.5454545454545454, "edit_distance": 25, "normalized_edit_distance": 0.45454545454545453, "word_accuracy": 0.0, "length_ratio": 0.7636363636363637, "predicted_length": 42, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.6666666666666666, "predicted_length": 28, "ground_truth_length": 42 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.2631578947368421, "edit_distance": 14, "normalized_edit_distance": 0.7368421052631579, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.5294117647058824, "predicted_length": 9, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.7058823529411765, "edit_distance": 15, "normalized_edit_distance": 0.29411764705882354, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.2727272727272727, "predicted_length": 12, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.3541666666666667, "edit_distance": 31, "normalized_edit_distance": 0.6458333333333334, "word_accuracy": 0.4, "length_ratio": 0.5625, "predicted_length": 27, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.1111111111111111, "length_ratio": 0.7837837837837838, "predicted_length": 29, "ground_truth_length": 37 }, { "character_accuracy": 0.29310344827586204, "edit_distance": 41, "normalized_edit_distance": 0.7068965517241379, "word_accuracy": 0.0, "length_ratio": 0.896551724137931, "predicted_length": 52, "ground_truth_length": 58 }, { "character_accuracy": 0.7727272727272727, "edit_distance": 10, "normalized_edit_distance": 0.22727272727272727, "word_accuracy": 0.2727272727272727, "length_ratio": 1.0, "predicted_length": 44, "ground_truth_length": 44 }, { "character_accuracy": 0.21212121212121213, "edit_distance": 26, "normalized_edit_distance": 0.7878787878787878, "word_accuracy": 0.0, "length_ratio": 0.5151515151515151, "predicted_length": 17, "ground_truth_length": 33 }, { "character_accuracy": 0.8620689655172413, "edit_distance": 8, "normalized_edit_distance": 0.13793103448275862, "word_accuracy": 0.6153846153846154, "length_ratio": 0.9655172413793104, "predicted_length": 56, "ground_truth_length": 58 }, { "character_accuracy": 0.5208333333333334, "edit_distance": 23, "normalized_edit_distance": 0.4791666666666667, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 36, "ground_truth_length": 48 }, { "character_accuracy": 0.5128205128205128, "edit_distance": 19, "normalized_edit_distance": 0.48717948717948717, "word_accuracy": 0.25, "length_ratio": 0.6410256410256411, "predicted_length": 25, "ground_truth_length": 39 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 35, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.47619047619047616, "predicted_length": 20, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8837209302325582, "edit_distance": 10, "normalized_edit_distance": 0.11627906976744186, "word_accuracy": 0.5714285714285714, "length_ratio": 0.9302325581395349, "predicted_length": 80, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.5128205128205128, "edit_distance": 19, "normalized_edit_distance": 0.48717948717948717, "word_accuracy": 0.3, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 12, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.35714285714285715, "predicted_length": 5, "ground_truth_length": 14 }, { "character_accuracy": 0.1875, "edit_distance": 26, "normalized_edit_distance": 0.8125, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 24, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.22448979591836735, "edit_distance": 38, "normalized_edit_distance": 0.7755102040816326, "word_accuracy": 0.16666666666666666, "length_ratio": 0.7142857142857143, "predicted_length": 35, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.3025210084033613, "edit_distance": 83, "normalized_edit_distance": 0.6974789915966386, "word_accuracy": 0.0, "length_ratio": 1.2142857142857142, "predicted_length": 119, "ground_truth_length": 98 }, { "character_accuracy": 0.2, "edit_distance": 8, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.3, "predicted_length": 3, "ground_truth_length": 10 }, { "character_accuracy": 0.35365853658536583, "edit_distance": 53, "normalized_edit_distance": 0.6463414634146342, "word_accuracy": 0.11764705882352941, "length_ratio": 0.8048780487804879, "predicted_length": 66, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.18421052631578946, "edit_distance": 31, "normalized_edit_distance": 0.8157894736842105, "word_accuracy": 0.07692307692307693, "length_ratio": 1.7272727272727273, "predicted_length": 38, "ground_truth_length": 22 }, { "character_accuracy": 0.75, "edit_distance": 9, "normalized_edit_distance": 0.25, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8888888888888888, "predicted_length": 32, "ground_truth_length": 36 }, { "character_accuracy": 0.75, "edit_distance": 11, "normalized_edit_distance": 0.25, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.9375, "edit_distance": 4, "normalized_edit_distance": 0.0625, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 64, "ground_truth_length": 64 }, { "character_accuracy": 0.2692307692307692, "edit_distance": 76, "normalized_edit_distance": 0.7307692307692307, "word_accuracy": 0.0, "length_ratio": 1.0947368421052632, "predicted_length": 104, "ground_truth_length": 95 }, { "character_accuracy": 0.16216216216216217, "edit_distance": 31, "normalized_edit_distance": 0.8378378378378378, "word_accuracy": 0.0, "length_ratio": 0.5405405405405406, "predicted_length": 20, "ground_truth_length": 37 }, { "character_accuracy": 0.7931034482758621, "edit_distance": 12, "normalized_edit_distance": 0.20689655172413793, "word_accuracy": 0.09090909090909091, "length_ratio": 0.9482758620689655, "predicted_length": 55, "ground_truth_length": 58 }, { "character_accuracy": 0.25, "edit_distance": 33, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 24, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.3235294117647059, "edit_distance": 23, "normalized_edit_distance": 0.6764705882352942, "word_accuracy": 0.125, "length_ratio": 0.6764705882352942, "predicted_length": 23, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8148148148148148, "edit_distance": 10, "normalized_edit_distance": 0.18518518518518517, "word_accuracy": 0.26666666666666666, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.2570093457943925, "edit_distance": 159, "normalized_edit_distance": 0.7429906542056075, "word_accuracy": 0.0, "length_ratio": 2.2061855670103094, "predicted_length": 214, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 11, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 6, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.045454545454545456, "edit_distance": 21, "normalized_edit_distance": 0.9545454545454546, "word_accuracy": 0.0, "length_ratio": 0.36363636363636365, "predicted_length": 8, "ground_truth_length": 22 }, { "character_accuracy": 0.25, "edit_distance": 45, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 1.0909090909090908, "predicted_length": 60, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 3, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.0, "length_ratio": 1.2857142857142858, "predicted_length": 9, "ground_truth_length": 7 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 5, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.06666666666666667, "edit_distance": 14, "normalized_edit_distance": 0.9333333333333333, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 6, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.7636363636363637, "edit_distance": 13, "normalized_edit_distance": 0.23636363636363636, "word_accuracy": 0.4, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.625, "edit_distance": 42, "normalized_edit_distance": 0.375, "word_accuracy": 0.5454545454545454, "length_ratio": 0.6607142857142857, "predicted_length": 74, "ground_truth_length": 112 }, { "character_accuracy": 0.625, "edit_distance": 18, "normalized_edit_distance": 0.375, "word_accuracy": 0.3, "length_ratio": 0.7708333333333334, "predicted_length": 37, "ground_truth_length": 48 }, { "character_accuracy": 0.0625, "edit_distance": 15, "normalized_edit_distance": 0.9375, "word_accuracy": 0.0, "length_ratio": 0.375, "predicted_length": 6, "ground_truth_length": 16 }, { "character_accuracy": 0.8222222222222222, "edit_distance": 8, "normalized_edit_distance": 0.17777777777777778, "word_accuracy": 0.6, "length_ratio": 0.9555555555555556, "predicted_length": 43, "ground_truth_length": 45 }, { "character_accuracy": 0.92, "edit_distance": 4, "normalized_edit_distance": 0.08, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.7127659574468085, "edit_distance": 27, "normalized_edit_distance": 0.2872340425531915, "word_accuracy": 0.3157894736842105, "length_ratio": 1.032967032967033, "predicted_length": 94, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.29411764705882354, "predicted_length": 5, "ground_truth_length": 17 }, { "character_accuracy": 0.2, "edit_distance": 32, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.425, "predicted_length": 17, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.25, "edit_distance": 3, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 1.3333333333333333, "predicted_length": 4, "ground_truth_length": 3 }, { "character_accuracy": 0.22115384615384615, "edit_distance": 81, "normalized_edit_distance": 0.7788461538461539, "word_accuracy": 0.0, "length_ratio": 0.9134615384615384, "predicted_length": 95, "ground_truth_length": 104 }, { "character_accuracy": 0.7604166666666666, "edit_distance": 23, "normalized_edit_distance": 0.23958333333333334, "word_accuracy": 0.5263157894736842, "length_ratio": 0.8333333333333334, "predicted_length": 80, "ground_truth_length": 96 }, { "character_accuracy": 0.7142857142857143, "edit_distance": 12, "normalized_edit_distance": 0.2857142857142857, "word_accuracy": 0.7777777777777778, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.2692307692307692, "edit_distance": 19, "normalized_edit_distance": 0.7307692307692307, "word_accuracy": 0.0, "length_ratio": 0.5769230769230769, "predicted_length": 15, "ground_truth_length": 26 }, { "character_accuracy": 0.5625, "edit_distance": 7, "normalized_edit_distance": 0.4375, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 12, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8813559322033898, "edit_distance": 7, "normalized_edit_distance": 0.11864406779661017, "word_accuracy": 0.6363636363636364, "length_ratio": 0.9661016949152542, "predicted_length": 57, "ground_truth_length": 59 }, { "character_accuracy": 0.2, "edit_distance": 8, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 6, "ground_truth_length": 10 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 24, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.5283018867924528, "edit_distance": 25, "normalized_edit_distance": 0.4716981132075472, "word_accuracy": 0.25, "length_ratio": 0.7547169811320755, "predicted_length": 40, "ground_truth_length": 53 }, { "character_accuracy": 0.7868852459016393, "edit_distance": 13, "normalized_edit_distance": 0.21311475409836064, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 3500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:31:13.650891", "loss": 0.7638715761899948, "perplexity": 2.1465706825256348, "min_loss": 0.37659427523612976, "max_loss": 1.35121488571167, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.4269453094792285, "avg_word_accuracy": 0.21375291643640013, "avg_edit_distance": 17.26, "avg_normalized_edit_distance": 0.5730546905207714, "avg_length_ratio": 0.7233992824713151, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.6792452830188679, "edit_distance": 17, "normalized_edit_distance": 0.32075471698113206, "word_accuracy": 0.25, "length_ratio": 0.8301886792452831, "predicted_length": 44, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.46511627906976744, "edit_distance": 46, "normalized_edit_distance": 0.5348837209302325, "word_accuracy": 0.5714285714285714, "length_ratio": 0.813953488372093, "predicted_length": 70, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6727272727272727, "edit_distance": 18, "normalized_edit_distance": 0.32727272727272727, "word_accuracy": 0.0, "length_ratio": 0.8545454545454545, "predicted_length": 47, "ground_truth_length": 55 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 4, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 28, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.0, "length_ratio": 0.9047619047619048, "predicted_length": 38, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.5294117647058824, "predicted_length": 9, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.8571428571428571, "predicted_length": 6, "ground_truth_length": 7 }, { "character_accuracy": 0.6862745098039216, "edit_distance": 16, "normalized_edit_distance": 0.3137254901960784, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.11363636363636363, "edit_distance": 39, "normalized_edit_distance": 0.8863636363636364, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 11, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.5833333333333334, "edit_distance": 20, "normalized_edit_distance": 0.4166666666666667, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6875, "predicted_length": 33, "ground_truth_length": 48 }, { "character_accuracy": 0.8490566037735849, "edit_distance": 8, "normalized_edit_distance": 0.1509433962264151, "word_accuracy": 0.7272727272727273, "length_ratio": 0.9245283018867925, "predicted_length": 49, "ground_truth_length": 53 }, { "character_accuracy": 0.21621621621621623, "edit_distance": 29, "normalized_edit_distance": 0.7837837837837838, "word_accuracy": 0.1, "length_ratio": 0.8108108108108109, "predicted_length": 30, "ground_truth_length": 37 }, { "character_accuracy": 0.3793103448275862, "edit_distance": 36, "normalized_edit_distance": 0.6206896551724138, "word_accuracy": 0.0, "length_ratio": 0.7931034482758621, "predicted_length": 46, "ground_truth_length": 58 }, { "character_accuracy": 0.8, "edit_distance": 9, "normalized_edit_distance": 0.2, "word_accuracy": 0.16666666666666666, "length_ratio": 1.0227272727272727, "predicted_length": 45, "ground_truth_length": 44 }, { "character_accuracy": 0.6060606060606061, "edit_distance": 13, "normalized_edit_distance": 0.3939393939393939, "word_accuracy": 0.125, "length_ratio": 0.6666666666666666, "predicted_length": 22, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.5208333333333334, "edit_distance": 23, "normalized_edit_distance": 0.4791666666666667, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 36, "ground_truth_length": 48 }, { "character_accuracy": 0.6410256410256411, "edit_distance": 14, "normalized_edit_distance": 0.358974358974359, "word_accuracy": 0.2, "length_ratio": 0.9487179487179487, "predicted_length": 37, "ground_truth_length": 39 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 35, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.1, "length_ratio": 0.35714285714285715, "predicted_length": 15, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.5462962962962963, "edit_distance": 49, "normalized_edit_distance": 0.4537037037037037, "word_accuracy": 0.23809523809523808, "length_ratio": 1.255813953488372, "predicted_length": 108, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.4444444444444444, "length_ratio": 0.8461538461538461, "predicted_length": 33, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 12, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 7, "ground_truth_length": 14 }, { "character_accuracy": 0.21875, "edit_distance": 25, "normalized_edit_distance": 0.78125, "word_accuracy": 0.0, "length_ratio": 0.78125, "predicted_length": 25, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.8571428571428571, "edit_distance": 7, "normalized_edit_distance": 0.14285714285714285, "word_accuracy": 0.6, "length_ratio": 1.0, "predicted_length": 49, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.40816326530612246, "edit_distance": 58, "normalized_edit_distance": 0.5918367346938775, "word_accuracy": 0.09090909090909091, "length_ratio": 0.8775510204081632, "predicted_length": 86, "ground_truth_length": 98 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.4268292682926829, "edit_distance": 47, "normalized_edit_distance": 0.573170731707317, "word_accuracy": 0.23529411764705882, "length_ratio": 0.8048780487804879, "predicted_length": 66, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.18421052631578946, "edit_distance": 31, "normalized_edit_distance": 0.8157894736842105, "word_accuracy": 0.07692307692307693, "length_ratio": 1.7272727272727273, "predicted_length": 38, "ground_truth_length": 22 }, { "character_accuracy": 0.7222222222222222, "edit_distance": 10, "normalized_edit_distance": 0.2777777777777778, "word_accuracy": 0.25, "length_ratio": 0.8611111111111112, "predicted_length": 31, "ground_truth_length": 36 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9772727272727273, "predicted_length": 43, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.9375, "edit_distance": 4, "normalized_edit_distance": 0.0625, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 64, "ground_truth_length": 64 }, { "character_accuracy": 0.2692307692307692, "edit_distance": 76, "normalized_edit_distance": 0.7307692307692307, "word_accuracy": 0.0, "length_ratio": 1.0947368421052632, "predicted_length": 104, "ground_truth_length": 95 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.0, "length_ratio": 0.6756756756756757, "predicted_length": 25, "ground_truth_length": 37 }, { "character_accuracy": 0.7241379310344828, "edit_distance": 16, "normalized_edit_distance": 0.27586206896551724, "word_accuracy": 0.08333333333333333, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.6818181818181818, "edit_distance": 14, "normalized_edit_distance": 0.3181818181818182, "word_accuracy": 0.3, "length_ratio": 0.7954545454545454, "predicted_length": 35, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.375, "length_ratio": 0.8529411764705882, "predicted_length": 29, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.7222222222222222, "edit_distance": 15, "normalized_edit_distance": 0.2777777777777778, "word_accuracy": 0.2, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.7731958762886598, "edit_distance": 22, "normalized_edit_distance": 0.2268041237113402, "word_accuracy": 0.391304347826087, "length_ratio": 0.9072164948453608, "predicted_length": 88, "ground_truth_length": 97 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 9, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 20, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 7, "ground_truth_length": 22 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 10, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.4166666666666667, "length_ratio": 0.8727272727272727, "predicted_length": 48, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.2, "edit_distance": 12, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 6, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.8545454545454545, "edit_distance": 8, "normalized_edit_distance": 0.14545454545454545, "word_accuracy": 0.4166666666666667, "length_ratio": 1.0, "predicted_length": 55, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.625, "edit_distance": 42, "normalized_edit_distance": 0.375, "word_accuracy": 0.5454545454545454, "length_ratio": 0.6607142857142857, "predicted_length": 74, "ground_truth_length": 112 }, { "character_accuracy": 0.2916666666666667, "edit_distance": 34, "normalized_edit_distance": 0.7083333333333334, "word_accuracy": 0.3, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.717391304347826, "edit_distance": 13, "normalized_edit_distance": 0.2826086956521739, "word_accuracy": 0.4166666666666667, "length_ratio": 1.0222222222222221, "predicted_length": 46, "ground_truth_length": 45 }, { "character_accuracy": 0.9, "edit_distance": 5, "normalized_edit_distance": 0.1, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.5494505494505495, "edit_distance": 41, "normalized_edit_distance": 0.45054945054945056, "word_accuracy": 0.25, "length_ratio": 0.9560439560439561, "predicted_length": 87, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.29411764705882354, "predicted_length": 5, "ground_truth_length": 17 }, { "character_accuracy": 0.25, "edit_distance": 30, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 16, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.25, "edit_distance": 3, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 1.3333333333333333, "predicted_length": 4, "ground_truth_length": 3 }, { "character_accuracy": 0.2, "edit_distance": 88, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 1.0576923076923077, "predicted_length": 110, "ground_truth_length": 104 }, { "character_accuracy": 0.8125, "edit_distance": 18, "normalized_edit_distance": 0.1875, "word_accuracy": 0.5789473684210527, "length_ratio": 0.8854166666666666, "predicted_length": 85, "ground_truth_length": 96 }, { "character_accuracy": 0.7142857142857143, "edit_distance": 12, "normalized_edit_distance": 0.2857142857142857, "word_accuracy": 0.7777777777777778, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.34615384615384615, "edit_distance": 17, "normalized_edit_distance": 0.6538461538461539, "word_accuracy": 0.0, "length_ratio": 0.6923076923076923, "predicted_length": 18, "ground_truth_length": 26 }, { "character_accuracy": 0.5625, "edit_distance": 7, "normalized_edit_distance": 0.4375, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 12, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8813559322033898, "edit_distance": 7, "normalized_edit_distance": 0.11864406779661017, "word_accuracy": 0.6363636363636364, "length_ratio": 0.9661016949152542, "predicted_length": 57, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.4528301886792453, "edit_distance": 29, "normalized_edit_distance": 0.5471698113207547, "word_accuracy": 0.15384615384615385, "length_ratio": 0.7358490566037735, "predicted_length": 39, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 4000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:32:24.191288", "loss": 0.7483316981792449, "perplexity": 2.113471269607544, "min_loss": 0.35888415575027466, "max_loss": 1.2802503108978271, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.4118163000520416, "avg_word_accuracy": 0.20419987234987233, "avg_edit_distance": 18.52, "avg_normalized_edit_distance": 0.5881836999479584, "avg_length_ratio": 0.6893215488281613, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.6415094339622641, "edit_distance": 19, "normalized_edit_distance": 0.3584905660377358, "word_accuracy": 0.4, "length_ratio": 0.7735849056603774, "predicted_length": 41, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.10465116279069768, "edit_distance": 77, "normalized_edit_distance": 0.8953488372093024, "word_accuracy": 0.0, "length_ratio": 0.29069767441860467, "predicted_length": 25, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.5818181818181818, "edit_distance": 23, "normalized_edit_distance": 0.41818181818181815, "word_accuracy": 0.0, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 4, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 14, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.14285714285714285, "length_ratio": 0.8095238095238095, "predicted_length": 34, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.7058823529411765, "edit_distance": 15, "normalized_edit_distance": 0.29411764705882354, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.3409090909090909, "predicted_length": 15, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 32, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.2727272727272727, "length_ratio": 0.5625, "predicted_length": 27, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.1111111111111111, "length_ratio": 0.7837837837837838, "predicted_length": 29, "ground_truth_length": 37 }, { "character_accuracy": 0.7068965517241379, "edit_distance": 17, "normalized_edit_distance": 0.29310344827586204, "word_accuracy": 0.3333333333333333, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.29545454545454547, "predicted_length": 13, "ground_truth_length": 44 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5384615384615384, "edit_distance": 18, "normalized_edit_distance": 0.46153846153846156, "word_accuracy": 0.25, "length_ratio": 0.6666666666666666, "predicted_length": 26, "ground_truth_length": 39 }, { "character_accuracy": 0.11904761904761904, "edit_distance": 37, "normalized_edit_distance": 0.8809523809523809, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 18, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8850574712643678, "edit_distance": 10, "normalized_edit_distance": 0.11494252873563218, "word_accuracy": 0.6428571428571429, "length_ratio": 1.0116279069767442, "predicted_length": 87, "ground_truth_length": 86 }, { "character_accuracy": 0.6631578947368421, "edit_distance": 32, "normalized_edit_distance": 0.3368421052631579, "word_accuracy": 0.23809523809523808, "length_ratio": 0.8, "predicted_length": 76, "ground_truth_length": 95 }, { "character_accuracy": 0.48717948717948717, "edit_distance": 20, "normalized_edit_distance": 0.5128205128205128, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 12, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 4, "ground_truth_length": 14 }, { "character_accuracy": 0.28125, "edit_distance": 23, "normalized_edit_distance": 0.71875, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 24, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.8775510204081632, "edit_distance": 6, "normalized_edit_distance": 0.12244897959183673, "word_accuracy": 0.6, "length_ratio": 0.9591836734693877, "predicted_length": 47, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.37755102040816324, "edit_distance": 61, "normalized_edit_distance": 0.6224489795918368, "word_accuracy": 0.05555555555555555, "length_ratio": 0.9081632653061225, "predicted_length": 89, "ground_truth_length": 98 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.2222222222222222, "edit_distance": 21, "normalized_edit_distance": 0.7777777777777778, "word_accuracy": 0.2222222222222222, "length_ratio": 1.2272727272727273, "predicted_length": 27, "ground_truth_length": 22 }, { "character_accuracy": 0.7222222222222222, "edit_distance": 10, "normalized_edit_distance": 0.2777777777777778, "word_accuracy": 0.25, "length_ratio": 0.8611111111111112, "predicted_length": 31, "ground_truth_length": 36 }, { "character_accuracy": 0.5227272727272727, "edit_distance": 21, "normalized_edit_distance": 0.4772727272727273, "word_accuracy": 0.0, "length_ratio": 0.8409090909090909, "predicted_length": 37, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.2692307692307692, "edit_distance": 76, "normalized_edit_distance": 0.7307692307692307, "word_accuracy": 0.0, "length_ratio": 1.0947368421052632, "predicted_length": 104, "ground_truth_length": 95 }, { "character_accuracy": 0.16216216216216217, "edit_distance": 31, "normalized_edit_distance": 0.8378378378378378, "word_accuracy": 0.0, "length_ratio": 0.40540540540540543, "predicted_length": 15, "ground_truth_length": 37 }, { "character_accuracy": 0.8103448275862069, "edit_distance": 11, "normalized_edit_distance": 0.1896551724137931, "word_accuracy": 0.09090909090909091, "length_ratio": 0.9482758620689655, "predicted_length": 55, "ground_truth_length": 58 }, { "character_accuracy": 0.38636363636363635, "edit_distance": 27, "normalized_edit_distance": 0.6136363636363636, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 32, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.375, "length_ratio": 0.8529411764705882, "predicted_length": 29, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.7222222222222222, "edit_distance": 15, "normalized_edit_distance": 0.2777777777777778, "word_accuracy": 0.2, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 160, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 2.216494845360825, "predicted_length": 215, "ground_truth_length": 97 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 9, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 16, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 12, "ground_truth_length": 22 }, { "character_accuracy": 0.2786885245901639, "edit_distance": 44, "normalized_edit_distance": 0.7213114754098361, "word_accuracy": 0.0, "length_ratio": 1.1090909090909091, "predicted_length": 61, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.4666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.5333333333333333, "word_accuracy": 0.25, "length_ratio": 0.8, "predicted_length": 12, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.7454545454545455, "edit_distance": 14, "normalized_edit_distance": 0.2545454545454545, "word_accuracy": 0.2727272727272727, "length_ratio": 0.8, "predicted_length": 44, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.625, "edit_distance": 42, "normalized_edit_distance": 0.375, "word_accuracy": 0.5454545454545454, "length_ratio": 0.6607142857142857, "predicted_length": 74, "ground_truth_length": 112 }, { "character_accuracy": 0.625, "edit_distance": 18, "normalized_edit_distance": 0.375, "word_accuracy": 0.3, "length_ratio": 0.7708333333333334, "predicted_length": 37, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.8222222222222222, "edit_distance": 8, "normalized_edit_distance": 0.17777777777777778, "word_accuracy": 0.5, "length_ratio": 0.9333333333333333, "predicted_length": 42, "ground_truth_length": 45 }, { "character_accuracy": 0.92, "edit_distance": 4, "normalized_edit_distance": 0.08, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.6153846153846154, "edit_distance": 35, "normalized_edit_distance": 0.38461538461538464, "word_accuracy": 0.23809523809523808, "length_ratio": 0.978021978021978, "predicted_length": 89, "ground_truth_length": 91 }, { "character_accuracy": 0.47058823529411764, "edit_distance": 9, "normalized_edit_distance": 0.5294117647058824, "word_accuracy": 0.0, "length_ratio": 0.6470588235294118, "predicted_length": 11, "ground_truth_length": 17 }, { "character_accuracy": 0.275, "edit_distance": 29, "normalized_edit_distance": 0.725, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 16, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.7980769230769231, "edit_distance": 21, "normalized_edit_distance": 0.20192307692307693, "word_accuracy": 0.65, "length_ratio": 0.875, "predicted_length": 91, "ground_truth_length": 104 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 22, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8958333333333334, "predicted_length": 86, "ground_truth_length": 96 }, { "character_accuracy": 0.7142857142857143, "edit_distance": 12, "normalized_edit_distance": 0.2857142857142857, "word_accuracy": 0.7777777777777778, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.38461538461538464, "edit_distance": 16, "normalized_edit_distance": 0.6153846153846154, "word_accuracy": 0.16666666666666666, "length_ratio": 0.6153846153846154, "predicted_length": 16, "ground_truth_length": 26 }, { "character_accuracy": 0.375, "edit_distance": 10, "normalized_edit_distance": 0.625, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.9333333333333333, "edit_distance": 4, "normalized_edit_distance": 0.06666666666666667, "word_accuracy": 0.7272727272727273, "length_ratio": 1.0169491525423728, "predicted_length": 60, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.12121212121212122, "edit_distance": 29, "normalized_edit_distance": 0.8787878787878788, "word_accuracy": 0.0, "length_ratio": 0.36363636363636365, "predicted_length": 12, "ground_truth_length": 33 }, { "character_accuracy": 0.4528301886792453, "edit_distance": 29, "normalized_edit_distance": 0.5471698113207547, "word_accuracy": 0.15384615384615385, "length_ratio": 0.7169811320754716, "predicted_length": 38, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 4500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:33:35.700383", "loss": 0.7466108947992325, "perplexity": 2.109837293624878, "min_loss": 0.3643028736114502, "max_loss": 1.3511654138565063, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.37289818752321646, "avg_word_accuracy": 0.18751171032270098, "avg_edit_distance": 22.77, "avg_normalized_edit_distance": 0.6271018124767838, "avg_length_ratio": 0.7063605980348483, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.6415094339622641, "edit_distance": 19, "normalized_edit_distance": 0.3584905660377358, "word_accuracy": 0.4, "length_ratio": 0.7735849056603774, "predicted_length": 41, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.20618556701030927, "edit_distance": 77, "normalized_edit_distance": 0.7938144329896907, "word_accuracy": 0.0, "length_ratio": 1.127906976744186, "predicted_length": 97, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6, "edit_distance": 22, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.6666666666666666, "predicted_length": 28, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.2631578947368421, "edit_distance": 14, "normalized_edit_distance": 0.7368421052631579, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.5294117647058824, "predicted_length": 9, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 2, "ground_truth_length": 7 }, { "character_accuracy": 0.7058823529411765, "edit_distance": 15, "normalized_edit_distance": 0.29411764705882354, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.38636363636363635, "edit_distance": 27, "normalized_edit_distance": 0.6136363636363636, "word_accuracy": 0.1111111111111111, "length_ratio": 0.5454545454545454, "predicted_length": 24, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.3090909090909091, "edit_distance": 38, "normalized_edit_distance": 0.6909090909090909, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.5, "edit_distance": 24, "normalized_edit_distance": 0.5, "word_accuracy": 0.5, "length_ratio": 0.6666666666666666, "predicted_length": 32, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 40, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 1.3513513513513513, "predicted_length": 50, "ground_truth_length": 37 }, { "character_accuracy": 0.7068965517241379, "edit_distance": 17, "normalized_edit_distance": 0.29310344827586204, "word_accuracy": 0.3333333333333333, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.2727272727272727, "predicted_length": 12, "ground_truth_length": 44 }, { "character_accuracy": 0.30303030303030304, "edit_distance": 23, "normalized_edit_distance": 0.696969696969697, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 18, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.1, "length_ratio": 0.8333333333333334, "predicted_length": 40, "ground_truth_length": 48 }, { "character_accuracy": 0.5128205128205128, "edit_distance": 19, "normalized_edit_distance": 0.48717948717948717, "word_accuracy": 0.25, "length_ratio": 0.6410256410256411, "predicted_length": 25, "ground_truth_length": 39 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 35, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.5238095238095238, "predicted_length": 22, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.7093023255813954, "edit_distance": 25, "normalized_edit_distance": 0.29069767441860467, "word_accuracy": 0.2777777777777778, "length_ratio": 0.9418604651162791, "predicted_length": 81, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.48717948717948717, "edit_distance": 20, "normalized_edit_distance": 0.5128205128205128, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7692307692307693, "predicted_length": 30, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.21428571428571427, "edit_distance": 11, "normalized_edit_distance": 0.7857142857142857, "word_accuracy": 0.0, "length_ratio": 0.35714285714285715, "predicted_length": 5, "ground_truth_length": 14 }, { "character_accuracy": 0.25, "edit_distance": 24, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.71875, "predicted_length": 23, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.24489795918367346, "edit_distance": 37, "normalized_edit_distance": 0.7551020408163265, "word_accuracy": 0.08333333333333333, "length_ratio": 0.5510204081632653, "predicted_length": 27, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.23952095808383234, "edit_distance": 127, "normalized_edit_distance": 0.7604790419161677, "word_accuracy": 0.0, "length_ratio": 1.7040816326530612, "predicted_length": 167, "ground_truth_length": 98 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.5853658536585366, "edit_distance": 34, "normalized_edit_distance": 0.4146341463414634, "word_accuracy": 0.29411764705882354, "length_ratio": 0.9024390243902439, "predicted_length": 74, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.2222222222222222, "edit_distance": 21, "normalized_edit_distance": 0.7777777777777778, "word_accuracy": 0.2222222222222222, "length_ratio": 1.2272727272727273, "predicted_length": 27, "ground_truth_length": 22 }, { "character_accuracy": 0.08333333333333333, "edit_distance": 33, "normalized_edit_distance": 0.9166666666666666, "word_accuracy": 0.0, "length_ratio": 0.2222222222222222, "predicted_length": 8, "ground_truth_length": 36 }, { "character_accuracy": 0.7272727272727273, "edit_distance": 12, "normalized_edit_distance": 0.2727272727272727, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9545454545454546, "predicted_length": 42, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.24603174603174602, "edit_distance": 95, "normalized_edit_distance": 0.753968253968254, "word_accuracy": 0.0, "length_ratio": 1.3263157894736841, "predicted_length": 126, "ground_truth_length": 95 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.125, "length_ratio": 0.6216216216216216, "predicted_length": 23, "ground_truth_length": 37 }, { "character_accuracy": 0.7241379310344828, "edit_distance": 16, "normalized_edit_distance": 0.27586206896551724, "word_accuracy": 0.08333333333333333, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.25, "edit_distance": 33, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.4772727272727273, "predicted_length": 21, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.14705882352941177, "edit_distance": 29, "normalized_edit_distance": 0.8529411764705882, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 16, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.7222222222222222, "edit_distance": 15, "normalized_edit_distance": 0.2777777777777778, "word_accuracy": 0.2, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 160, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 2.216494845360825, "predicted_length": 215, "ground_truth_length": 97 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 9, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.25, "length_ratio": 0.8181818181818182, "predicted_length": 9, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 19, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 11, "ground_truth_length": 22 }, { "character_accuracy": 0.2, "edit_distance": 44, "normalized_edit_distance": 0.8, "word_accuracy": 0.15384615384615385, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.4666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.5333333333333333, "word_accuracy": 0.25, "length_ratio": 0.8, "predicted_length": 12, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6545454545454545, "edit_distance": 19, "normalized_edit_distance": 0.34545454545454546, "word_accuracy": 0.08333333333333333, "length_ratio": 0.7636363636363637, "predicted_length": 42, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.23214285714285715, "edit_distance": 129, "normalized_edit_distance": 0.7678571428571429, "word_accuracy": 0.0, "length_ratio": 1.5, "predicted_length": 168, "ground_truth_length": 112 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.3, "length_ratio": 0.8333333333333334, "predicted_length": 40, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.8222222222222222, "edit_distance": 8, "normalized_edit_distance": 0.17777777777777778, "word_accuracy": 0.6, "length_ratio": 0.9555555555555556, "predicted_length": 43, "ground_truth_length": 45 }, { "character_accuracy": 0.86, "edit_distance": 7, "normalized_edit_distance": 0.14, "word_accuracy": 0.5555555555555556, "length_ratio": 0.98, "predicted_length": 49, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.2672413793103448, "edit_distance": 85, "normalized_edit_distance": 0.7327586206896551, "word_accuracy": 0.07142857142857142, "length_ratio": 1.2747252747252746, "predicted_length": 116, "ground_truth_length": 91 }, { "character_accuracy": 0.11764705882352941, "edit_distance": 15, "normalized_edit_distance": 0.8823529411764706, "word_accuracy": 0.0, "length_ratio": 0.29411764705882354, "predicted_length": 5, "ground_truth_length": 17 }, { "character_accuracy": 0.225, "edit_distance": 31, "normalized_edit_distance": 0.775, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 16, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 3, "ground_truth_length": 3 }, { "character_accuracy": 0.23214285714285715, "edit_distance": 129, "normalized_edit_distance": 0.7678571428571429, "word_accuracy": 0.0, "length_ratio": 1.6153846153846154, "predicted_length": 168, "ground_truth_length": 104 }, { "character_accuracy": 0.7604166666666666, "edit_distance": 23, "normalized_edit_distance": 0.23958333333333334, "word_accuracy": 0.5263157894736842, "length_ratio": 0.8333333333333334, "predicted_length": 80, "ground_truth_length": 96 }, { "character_accuracy": 0.7142857142857143, "edit_distance": 12, "normalized_edit_distance": 0.2857142857142857, "word_accuracy": 0.7777777777777778, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.7272727272727273, "edit_distance": 12, "normalized_edit_distance": 0.2727272727272727, "word_accuracy": 0.3333333333333333, "length_ratio": 0.8409090909090909, "predicted_length": 37, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 14, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.4, "length_ratio": 0.6538461538461539, "predicted_length": 17, "ground_truth_length": 26 }, { "character_accuracy": 0.5625, "edit_distance": 7, "normalized_edit_distance": 0.4375, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 12, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.9333333333333333, "edit_distance": 4, "normalized_edit_distance": 0.06666666666666667, "word_accuracy": 0.7272727272727273, "length_ratio": 1.0169491525423728, "predicted_length": 60, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.45454545454545453, "predicted_length": 15, "ground_truth_length": 33 }, { "character_accuracy": 0.11320754716981132, "edit_distance": 47, "normalized_edit_distance": 0.8867924528301887, "word_accuracy": 0.0, "length_ratio": 0.3584905660377358, "predicted_length": 19, "ground_truth_length": 53 }, { "character_accuracy": 0.9016393442622951, "edit_distance": 6, "normalized_edit_distance": 0.09836065573770492, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9836065573770492, "predicted_length": 60, "ground_truth_length": 61 } ] }, { "step": 5000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:34:46.508411", "loss": 0.7357740467786789, "perplexity": 2.087096929550171, "min_loss": 0.3380905091762543, "max_loss": 1.4315803050994873, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.4040487895262258, "avg_word_accuracy": 0.20475821400821398, "avg_edit_distance": 21.57, "avg_normalized_edit_distance": 0.5959512104737743, "avg_length_ratio": 0.7426856301416462, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.8, "edit_distance": 2, "normalized_edit_distance": 0.2, "word_accuracy": 0.3333333333333333, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.7735849056603774, "edit_distance": 12, "normalized_edit_distance": 0.22641509433962265, "word_accuracy": 0.23076923076923078, "length_ratio": 0.8679245283018868, "predicted_length": 46, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.20618556701030927, "edit_distance": 77, "normalized_edit_distance": 0.7938144329896907, "word_accuracy": 0.0, "length_ratio": 1.127906976744186, "predicted_length": 97, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.5818181818181818, "edit_distance": 23, "normalized_edit_distance": 0.41818181818181815, "word_accuracy": 0.0, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 4, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.7380952380952381, "predicted_length": 31, "ground_truth_length": 42 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.5294117647058824, "predicted_length": 9, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.14285714285714285, "predicted_length": 1, "ground_truth_length": 7 }, { "character_accuracy": 0.7058823529411765, "edit_distance": 15, "normalized_edit_distance": 0.29411764705882354, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.1590909090909091, "edit_distance": 37, "normalized_edit_distance": 0.8409090909090909, "word_accuracy": 0.0, "length_ratio": 0.4090909090909091, "predicted_length": 18, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.1896551724137931, "edit_distance": 47, "normalized_edit_distance": 0.8103448275862069, "word_accuracy": 0.06666666666666667, "length_ratio": 1.0545454545454545, "predicted_length": 58, "ground_truth_length": 55 }, { "character_accuracy": 0.5, "edit_distance": 24, "normalized_edit_distance": 0.5, "word_accuracy": 0.4, "length_ratio": 0.6041666666666666, "predicted_length": 29, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.21621621621621623, "edit_distance": 29, "normalized_edit_distance": 0.7837837837837838, "word_accuracy": 0.0, "length_ratio": 0.6756756756756757, "predicted_length": 25, "ground_truth_length": 37 }, { "character_accuracy": 0.3103448275862069, "edit_distance": 40, "normalized_edit_distance": 0.6896551724137931, "word_accuracy": 0.0, "length_ratio": 0.8793103448275862, "predicted_length": 51, "ground_truth_length": 58 }, { "character_accuracy": 0.20454545454545456, "edit_distance": 35, "normalized_edit_distance": 0.7954545454545454, "word_accuracy": 0.375, "length_ratio": 0.4772727272727273, "predicted_length": 21, "ground_truth_length": 44 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 27, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 11, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.2, "length_ratio": 0.8958333333333334, "predicted_length": 43, "ground_truth_length": 48 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 13, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.2222222222222222, "length_ratio": 0.7948717948717948, "predicted_length": 31, "ground_truth_length": 39 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 35, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.5238095238095238, "predicted_length": 22, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.5378151260504201, "edit_distance": 55, "normalized_edit_distance": 0.46218487394957986, "word_accuracy": 0.25, "length_ratio": 1.3837209302325582, "predicted_length": 119, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.5641025641025641, "edit_distance": 17, "normalized_edit_distance": 0.4358974358974359, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8205128205128205, "predicted_length": 32, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.2857142857142857, "edit_distance": 10, "normalized_edit_distance": 0.7142857142857143, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 6, "ground_truth_length": 14 }, { "character_accuracy": 0.28125, "edit_distance": 23, "normalized_edit_distance": 0.71875, "word_accuracy": 0.0, "length_ratio": 0.96875, "predicted_length": 31, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.8979591836734694, "edit_distance": 5, "normalized_edit_distance": 0.10204081632653061, "word_accuracy": 0.6, "length_ratio": 0.9591836734693877, "predicted_length": 47, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.23952095808383234, "edit_distance": 127, "normalized_edit_distance": 0.7604790419161677, "word_accuracy": 0.0, "length_ratio": 1.7040816326530612, "predicted_length": 167, "ground_truth_length": 98 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.17391304347826086, "edit_distance": 19, "normalized_edit_distance": 0.8260869565217391, "word_accuracy": 0.1111111111111111, "length_ratio": 1.0454545454545454, "predicted_length": 23, "ground_truth_length": 22 }, { "character_accuracy": 0.027777777777777776, "edit_distance": 35, "normalized_edit_distance": 0.9722222222222222, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 9, "ground_truth_length": 36 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.23958333333333334, "edit_distance": 73, "normalized_edit_distance": 0.7604166666666666, "word_accuracy": 0.0, "length_ratio": 1.0105263157894737, "predicted_length": 96, "ground_truth_length": 95 }, { "character_accuracy": 0.24324324324324326, "edit_distance": 28, "normalized_edit_distance": 0.7567567567567568, "word_accuracy": 0.0, "length_ratio": 0.6486486486486487, "predicted_length": 24, "ground_truth_length": 37 }, { "character_accuracy": 0.7241379310344828, "edit_distance": 16, "normalized_edit_distance": 0.27586206896551724, "word_accuracy": 0.08333333333333333, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.3181818181818182, "edit_distance": 30, "normalized_edit_distance": 0.6818181818181818, "word_accuracy": 0.0, "length_ratio": 0.6590909090909091, "predicted_length": 29, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.375, "length_ratio": 0.8529411764705882, "predicted_length": 29, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 6, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.7272727272727273, "length_ratio": 0.9629629629629629, "predicted_length": 52, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 160, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 2.216494845360825, "predicted_length": 215, "ground_truth_length": 97 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 9, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.25, "length_ratio": 0.8181818181818182, "predicted_length": 9, "ground_truth_length": 11 }, { "character_accuracy": 0.5154639175257731, "edit_distance": 47, "normalized_edit_distance": 0.4845360824742268, "word_accuracy": 0.42857142857142855, "length_ratio": 0.7628865979381443, "predicted_length": 74, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 20, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 5, "ground_truth_length": 22 }, { "character_accuracy": 0.2542372881355932, "edit_distance": 44, "normalized_edit_distance": 0.7457627118644068, "word_accuracy": 0.0, "length_ratio": 1.0727272727272728, "predicted_length": 59, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 10, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.25, "length_ratio": 0.6, "predicted_length": 9, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.8727272727272727, "edit_distance": 7, "normalized_edit_distance": 0.12727272727272726, "word_accuracy": 0.3333333333333333, "length_ratio": 1.0, "predicted_length": 55, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.3125, "edit_distance": 77, "normalized_edit_distance": 0.6875, "word_accuracy": 0.041666666666666664, "length_ratio": 0.8125, "predicted_length": 91, "ground_truth_length": 112 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.5555555555555556, "length_ratio": 0.875, "predicted_length": 42, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.8222222222222222, "edit_distance": 8, "normalized_edit_distance": 0.17777777777777778, "word_accuracy": 0.6, "length_ratio": 0.9555555555555556, "predicted_length": 43, "ground_truth_length": 45 }, { "character_accuracy": 0.9, "edit_distance": 5, "normalized_edit_distance": 0.1, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.5257731958762887, "edit_distance": 46, "normalized_edit_distance": 0.4742268041237113, "word_accuracy": 0.22727272727272727, "length_ratio": 1.065934065934066, "predicted_length": 97, "ground_truth_length": 91 }, { "character_accuracy": 0.29411764705882354, "edit_distance": 12, "normalized_edit_distance": 0.7058823529411765, "word_accuracy": 0.0, "length_ratio": 0.6470588235294118, "predicted_length": 11, "ground_truth_length": 17 }, { "character_accuracy": 0.225, "edit_distance": 31, "normalized_edit_distance": 0.775, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 16, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 3, "ground_truth_length": 3 }, { "character_accuracy": 0.22580645161290322, "edit_distance": 120, "normalized_edit_distance": 0.7741935483870968, "word_accuracy": 0.0, "length_ratio": 1.4903846153846154, "predicted_length": 155, "ground_truth_length": 104 }, { "character_accuracy": 0.24043715846994534, "edit_distance": 139, "normalized_edit_distance": 0.7595628415300546, "word_accuracy": 0.0, "length_ratio": 1.90625, "predicted_length": 183, "ground_truth_length": 96 }, { "character_accuracy": 0.7142857142857143, "edit_distance": 12, "normalized_edit_distance": 0.2857142857142857, "word_accuracy": 0.7777777777777778, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.8181818181818182, "edit_distance": 8, "normalized_edit_distance": 0.18181818181818182, "word_accuracy": 0.5, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 14, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.4, "length_ratio": 0.6538461538461539, "predicted_length": 17, "ground_truth_length": 26 }, { "character_accuracy": 0.375, "edit_distance": 10, "normalized_edit_distance": 0.625, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.9333333333333333, "edit_distance": 4, "normalized_edit_distance": 0.06666666666666667, "word_accuracy": 0.7272727272727273, "length_ratio": 1.0169491525423728, "predicted_length": 60, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.45454545454545453, "predicted_length": 15, "ground_truth_length": 33 }, { "character_accuracy": 0.4716981132075472, "edit_distance": 28, "normalized_edit_distance": 0.5283018867924528, "word_accuracy": 0.15384615384615385, "length_ratio": 0.6981132075471698, "predicted_length": 37, "ground_truth_length": 53 }, { "character_accuracy": 0.9016393442622951, "edit_distance": 6, "normalized_edit_distance": 0.09836065573770492, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9836065573770492, "predicted_length": 60, "ground_truth_length": 61 } ] }, { "step": 5500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:35:57.487710", "loss": 0.732145220041275, "perplexity": 2.0795369148254395, "min_loss": 0.3273903727531433, "max_loss": 1.3533048629760742, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.38061094014940244, "avg_word_accuracy": 0.18906373171704974, "avg_edit_distance": 20.81, "avg_normalized_edit_distance": 0.6193890598505974, "avg_length_ratio": 0.6973468802703299, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3, "predicted_length": 3, "ground_truth_length": 10 }, { "character_accuracy": 0.2641509433962264, "edit_distance": 39, "normalized_edit_distance": 0.7358490566037735, "word_accuracy": 0.0, "length_ratio": 0.4716981132075472, "predicted_length": 25, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.12790697674418605, "edit_distance": 75, "normalized_edit_distance": 0.872093023255814, "word_accuracy": 0.06666666666666667, "length_ratio": 0.6627906976744186, "predicted_length": 57, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.4909090909090909, "edit_distance": 28, "normalized_edit_distance": 0.509090909090909, "word_accuracy": 0.0, "length_ratio": 0.6727272727272727, "predicted_length": 37, "ground_truth_length": 55 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 4, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.7380952380952381, "predicted_length": 31, "ground_truth_length": 42 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.5294117647058824, "predicted_length": 9, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.14285714285714285, "predicted_length": 1, "ground_truth_length": 7 }, { "character_accuracy": 0.9215686274509803, "edit_distance": 4, "normalized_edit_distance": 0.0784313725490196, "word_accuracy": 0.6363636363636364, "length_ratio": 1.0, "predicted_length": 51, "ground_truth_length": 51 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 40, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.3409090909090909, "predicted_length": 15, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.3090909090909091, "edit_distance": 38, "normalized_edit_distance": 0.6909090909090909, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.5, "edit_distance": 24, "normalized_edit_distance": 0.5, "word_accuracy": 0.5, "length_ratio": 0.6666666666666666, "predicted_length": 32, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.40540540540540543, "edit_distance": 22, "normalized_edit_distance": 0.5945945945945946, "word_accuracy": 0.0, "length_ratio": 0.7027027027027027, "predicted_length": 26, "ground_truth_length": 37 }, { "character_accuracy": 0.7068965517241379, "edit_distance": 17, "normalized_edit_distance": 0.29310344827586204, "word_accuracy": 0.3333333333333333, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 38, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.1, "length_ratio": 0.4318181818181818, "predicted_length": 19, "ground_truth_length": 44 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.5757575757575758, "predicted_length": 19, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.1282051282051282, "edit_distance": 34, "normalized_edit_distance": 0.8717948717948718, "word_accuracy": 0.0, "length_ratio": 0.7435897435897436, "predicted_length": 29, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 42, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.38095238095238093, "predicted_length": 16, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8837209302325582, "edit_distance": 10, "normalized_edit_distance": 0.11627906976744186, "word_accuracy": 0.5714285714285714, "length_ratio": 0.9302325581395349, "predicted_length": 80, "ground_truth_length": 86 }, { "character_accuracy": 0.42105263157894735, "edit_distance": 55, "normalized_edit_distance": 0.5789473684210527, "word_accuracy": 0.13043478260869565, "length_ratio": 0.8315789473684211, "predicted_length": 79, "ground_truth_length": 95 }, { "character_accuracy": 0.7435897435897436, "edit_distance": 10, "normalized_edit_distance": 0.2564102564102564, "word_accuracy": 0.4444444444444444, "length_ratio": 0.7948717948717948, "predicted_length": 31, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.0, "edit_distance": 14, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 7, "ground_truth_length": 14 }, { "character_accuracy": 0.21875, "edit_distance": 25, "normalized_edit_distance": 0.78125, "word_accuracy": 0.0, "length_ratio": 0.8125, "predicted_length": 26, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 42, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.8775510204081632, "predicted_length": 43, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.20202020202020202, "edit_distance": 79, "normalized_edit_distance": 0.797979797979798, "word_accuracy": 0.0, "length_ratio": 1.010204081632653, "predicted_length": 99, "ground_truth_length": 98 }, { "character_accuracy": 0.6, "edit_distance": 4, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.18421052631578946, "edit_distance": 31, "normalized_edit_distance": 0.8157894736842105, "word_accuracy": 0.07692307692307693, "length_ratio": 1.7272727272727273, "predicted_length": 38, "ground_truth_length": 22 }, { "character_accuracy": 0.08333333333333333, "edit_distance": 33, "normalized_edit_distance": 0.9166666666666666, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 9, "ground_truth_length": 36 }, { "character_accuracy": 0.75, "edit_distance": 11, "normalized_edit_distance": 0.25, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.9375, "edit_distance": 4, "normalized_edit_distance": 0.0625, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 64, "ground_truth_length": 64 }, { "character_accuracy": 0.31666666666666665, "edit_distance": 82, "normalized_edit_distance": 0.6833333333333333, "word_accuracy": 0.0, "length_ratio": 1.263157894736842, "predicted_length": 120, "ground_truth_length": 95 }, { "character_accuracy": 0.21621621621621623, "edit_distance": 29, "normalized_edit_distance": 0.7837837837837838, "word_accuracy": 0.0, "length_ratio": 0.6216216216216216, "predicted_length": 23, "ground_truth_length": 37 }, { "character_accuracy": 0.7758620689655172, "edit_distance": 13, "normalized_edit_distance": 0.22413793103448276, "word_accuracy": 0.0, "length_ratio": 0.9482758620689655, "predicted_length": 55, "ground_truth_length": 58 }, { "character_accuracy": 0.045454545454545456, "edit_distance": 42, "normalized_edit_distance": 0.9545454545454546, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 14, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8235294117647058, "predicted_length": 28, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 18, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.2, "length_ratio": 1.0, "predicted_length": 54, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 5, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.05, "edit_distance": 19, "normalized_edit_distance": 0.95, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 5, "ground_truth_length": 20 }, { "character_accuracy": 0.8041237113402062, "edit_distance": 19, "normalized_edit_distance": 0.1958762886597938, "word_accuracy": 0.6, "length_ratio": 0.8969072164948454, "predicted_length": 87, "ground_truth_length": 97 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 8, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.27, "edit_distance": 73, "normalized_edit_distance": 0.73, "word_accuracy": 0.375, "length_ratio": 1.0309278350515463, "predicted_length": 100, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.09090909090909091, "edit_distance": 20, "normalized_edit_distance": 0.9090909090909091, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 7, "ground_truth_length": 22 }, { "character_accuracy": 0.7818181818181819, "edit_distance": 12, "normalized_edit_distance": 0.21818181818181817, "word_accuracy": 0.5454545454545454, "length_ratio": 0.8545454545454545, "predicted_length": 47, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 5, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 10, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.25, "length_ratio": 0.6, "predicted_length": 9, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.7636363636363637, "edit_distance": 13, "normalized_edit_distance": 0.23636363636363636, "word_accuracy": 0.4, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.2185792349726776, "edit_distance": 143, "normalized_edit_distance": 0.7814207650273224, "word_accuracy": 0.0, "length_ratio": 1.6339285714285714, "predicted_length": 183, "ground_truth_length": 112 }, { "character_accuracy": 0.14583333333333334, "edit_distance": 41, "normalized_edit_distance": 0.8541666666666666, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 16, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.6875, "edit_distance": 15, "normalized_edit_distance": 0.3125, "word_accuracy": 0.45454545454545453, "length_ratio": 1.0666666666666667, "predicted_length": 48, "ground_truth_length": 45 }, { "character_accuracy": 0.84, "edit_distance": 8, "normalized_edit_distance": 0.16, "word_accuracy": 0.5555555555555556, "length_ratio": 0.98, "predicted_length": 49, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.2601626016260163, "edit_distance": 91, "normalized_edit_distance": 0.7398373983739838, "word_accuracy": 0.07142857142857142, "length_ratio": 1.3516483516483517, "predicted_length": 123, "ground_truth_length": 91 }, { "character_accuracy": 0.29411764705882354, "edit_distance": 12, "normalized_edit_distance": 0.7058823529411765, "word_accuracy": 0.0, "length_ratio": 0.6470588235294118, "predicted_length": 11, "ground_truth_length": 17 }, { "character_accuracy": 0.15, "edit_distance": 34, "normalized_edit_distance": 0.85, "word_accuracy": 0.0, "length_ratio": 0.35, "predicted_length": 14, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.2, "edit_distance": 88, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 1.0576923076923077, "predicted_length": 110, "ground_truth_length": 104 }, { "character_accuracy": 0.7604166666666666, "edit_distance": 23, "normalized_edit_distance": 0.23958333333333334, "word_accuracy": 0.5263157894736842, "length_ratio": 0.8333333333333334, "predicted_length": 80, "ground_truth_length": 96 }, { "character_accuracy": 0.5476190476190477, "edit_distance": 19, "normalized_edit_distance": 0.4523809523809524, "word_accuracy": 0.45454545454545453, "length_ratio": 0.8333333333333334, "predicted_length": 35, "ground_truth_length": 42 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.375, "length_ratio": 0.7954545454545454, "predicted_length": 35, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.46153846153846156, "edit_distance": 14, "normalized_edit_distance": 0.5384615384615384, "word_accuracy": 0.4, "length_ratio": 0.6538461538461539, "predicted_length": 17, "ground_truth_length": 26 }, { "character_accuracy": 0.375, "edit_distance": 10, "normalized_edit_distance": 0.625, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8135593220338984, "edit_distance": 11, "normalized_edit_distance": 0.1864406779661017, "word_accuracy": 0.5, "length_ratio": 0.9152542372881356, "predicted_length": 54, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.45454545454545453, "predicted_length": 15, "ground_truth_length": 33 }, { "character_accuracy": 0.18867924528301888, "edit_distance": 43, "normalized_edit_distance": 0.8113207547169812, "word_accuracy": 0.2, "length_ratio": 0.5471698113207547, "predicted_length": 29, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 6000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:37:08.212937", "loss": 0.7276217466592789, "perplexity": 2.0701513290405273, "min_loss": 0.35830122232437134, "max_loss": 1.334588885307312, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.3881718837882011, "avg_word_accuracy": 0.1760970395101974, "avg_edit_distance": 22.64, "avg_normalized_edit_distance": 0.6118281162117989, "avg_length_ratio": 0.715380332049047, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.6415094339622641, "edit_distance": 19, "normalized_edit_distance": 0.3584905660377358, "word_accuracy": 0.4, "length_ratio": 0.7735849056603774, "predicted_length": 41, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.12790697674418605, "edit_distance": 75, "normalized_edit_distance": 0.872093023255814, "word_accuracy": 0.06666666666666667, "length_ratio": 0.6627906976744186, "predicted_length": 57, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6, "edit_distance": 22, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.5714285714285714, "edit_distance": 3, "normalized_edit_distance": 0.42857142857142855, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.6904761904761905, "predicted_length": 29, "ground_truth_length": 42 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.14285714285714285, "predicted_length": 1, "ground_truth_length": 7 }, { "character_accuracy": 0.7058823529411765, "edit_distance": 15, "normalized_edit_distance": 0.29411764705882354, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.3409090909090909, "edit_distance": 29, "normalized_edit_distance": 0.6590909090909091, "word_accuracy": 0.0, "length_ratio": 0.6363636363636364, "predicted_length": 28, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.3090909090909091, "edit_distance": 38, "normalized_edit_distance": 0.6909090909090909, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.4583333333333333, "edit_distance": 26, "normalized_edit_distance": 0.5416666666666666, "word_accuracy": 0.36363636363636365, "length_ratio": 0.625, "predicted_length": 30, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.32432432432432434, "edit_distance": 25, "normalized_edit_distance": 0.6756756756756757, "word_accuracy": 0.1111111111111111, "length_ratio": 0.7567567567567568, "predicted_length": 28, "ground_truth_length": 37 }, { "character_accuracy": 0.4482758620689655, "edit_distance": 32, "normalized_edit_distance": 0.5517241379310345, "word_accuracy": 0.0, "length_ratio": 0.7758620689655172, "predicted_length": 45, "ground_truth_length": 58 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 38, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.1, "length_ratio": 0.4318181818181818, "predicted_length": 19, "ground_truth_length": 44 }, { "character_accuracy": 0.12121212121212122, "edit_distance": 29, "normalized_edit_distance": 0.8787878787878788, "word_accuracy": 0.0, "length_ratio": 0.6666666666666666, "predicted_length": 22, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.1282051282051282, "edit_distance": 34, "normalized_edit_distance": 0.8717948717948718, "word_accuracy": 0.0, "length_ratio": 0.7435897435897436, "predicted_length": 29, "ground_truth_length": 39 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 36, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.40476190476190477, "predicted_length": 17, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8837209302325582, "edit_distance": 10, "normalized_edit_distance": 0.11627906976744186, "word_accuracy": 0.5714285714285714, "length_ratio": 0.9302325581395349, "predicted_length": 80, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.7435897435897436, "edit_distance": 10, "normalized_edit_distance": 0.2564102564102564, "word_accuracy": 0.4444444444444444, "length_ratio": 0.7948717948717948, "predicted_length": 31, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.0, "edit_distance": 14, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 7, "ground_truth_length": 14 }, { "character_accuracy": 0.25, "edit_distance": 24, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.71875, "predicted_length": 23, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.20408163265306123, "edit_distance": 39, "normalized_edit_distance": 0.7959183673469388, "word_accuracy": 0.0, "length_ratio": 0.5306122448979592, "predicted_length": 26, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.208, "edit_distance": 99, "normalized_edit_distance": 0.792, "word_accuracy": 0.0, "length_ratio": 1.2755102040816326, "predicted_length": 125, "ground_truth_length": 98 }, { "character_accuracy": 0.6, "edit_distance": 4, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.20512820512820512, "edit_distance": 31, "normalized_edit_distance": 0.7948717948717948, "word_accuracy": 0.16666666666666666, "length_ratio": 1.7727272727272727, "predicted_length": 39, "ground_truth_length": 22 }, { "character_accuracy": 0.1111111111111111, "edit_distance": 32, "normalized_edit_distance": 0.8888888888888888, "word_accuracy": 0.0, "length_ratio": 0.2777777777777778, "predicted_length": 10, "ground_truth_length": 36 }, { "character_accuracy": 0.7727272727272727, "edit_distance": 10, "normalized_edit_distance": 0.22727272727272727, "word_accuracy": 0.3, "length_ratio": 0.9318181818181818, "predicted_length": 41, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.2636363636363636, "edit_distance": 81, "normalized_edit_distance": 0.7363636363636363, "word_accuracy": 0.0, "length_ratio": 1.1578947368421053, "predicted_length": 110, "ground_truth_length": 95 }, { "character_accuracy": 0.21621621621621623, "edit_distance": 29, "normalized_edit_distance": 0.7837837837837838, "word_accuracy": 0.0, "length_ratio": 0.6216216216216216, "predicted_length": 23, "ground_truth_length": 37 }, { "character_accuracy": 0.7413793103448276, "edit_distance": 15, "normalized_edit_distance": 0.25862068965517243, "word_accuracy": 0.0, "length_ratio": 0.9482758620689655, "predicted_length": 55, "ground_truth_length": 58 }, { "character_accuracy": 0.045454545454545456, "edit_distance": 42, "normalized_edit_distance": 0.9545454545454546, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 14, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.6176470588235294, "edit_distance": 13, "normalized_edit_distance": 0.38235294117647056, "word_accuracy": 0.375, "length_ratio": 0.8529411764705882, "predicted_length": 29, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.7777777777777778, "edit_distance": 12, "normalized_edit_distance": 0.2222222222222222, "word_accuracy": 0.35714285714285715, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.2, "edit_distance": 16, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 8, "ground_truth_length": 20 }, { "character_accuracy": 0.2570093457943925, "edit_distance": 159, "normalized_edit_distance": 0.7429906542056075, "word_accuracy": 0.0, "length_ratio": 2.2061855670103094, "predicted_length": 214, "ground_truth_length": 97 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 8, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 19, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 7, "ground_truth_length": 22 }, { "character_accuracy": 0.234375, "edit_distance": 49, "normalized_edit_distance": 0.765625, "word_accuracy": 0.05263157894736842, "length_ratio": 1.1636363636363636, "predicted_length": 64, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 5, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 10, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.25, "length_ratio": 0.6, "predicted_length": 9, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6727272727272727, "edit_distance": 18, "normalized_edit_distance": 0.32727272727272727, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.23214285714285715, "edit_distance": 129, "normalized_edit_distance": 0.7678571428571429, "word_accuracy": 0.0, "length_ratio": 1.5, "predicted_length": 168, "ground_truth_length": 112 }, { "character_accuracy": 0.14583333333333334, "edit_distance": 41, "normalized_edit_distance": 0.8541666666666666, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 16, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.8, "edit_distance": 9, "normalized_edit_distance": 0.2, "word_accuracy": 0.5, "length_ratio": 0.9333333333333333, "predicted_length": 42, "ground_truth_length": 45 }, { "character_accuracy": 0.9, "edit_distance": 5, "normalized_edit_distance": 0.1, "word_accuracy": 0.5555555555555556, "length_ratio": 1.0, "predicted_length": 50, "ground_truth_length": 50 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 6, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.8571428571428571, "predicted_length": 6, "ground_truth_length": 7 }, { "character_accuracy": 0.20212765957446807, "edit_distance": 75, "normalized_edit_distance": 0.7978723404255319, "word_accuracy": 0.0, "length_ratio": 1.032967032967033, "predicted_length": 94, "ground_truth_length": 91 }, { "character_accuracy": 0.29411764705882354, "edit_distance": 12, "normalized_edit_distance": 0.7058823529411765, "word_accuracy": 0.0, "length_ratio": 0.6470588235294118, "predicted_length": 11, "ground_truth_length": 17 }, { "character_accuracy": 0.35, "edit_distance": 26, "normalized_edit_distance": 0.65, "word_accuracy": 0.0, "length_ratio": 0.65, "predicted_length": 26, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.7980769230769231, "edit_distance": 21, "normalized_edit_distance": 0.20192307692307693, "word_accuracy": 0.65, "length_ratio": 0.875, "predicted_length": 91, "ground_truth_length": 104 }, { "character_accuracy": 0.22009569377990432, "edit_distance": 163, "normalized_edit_distance": 0.7799043062200957, "word_accuracy": 0.0, "length_ratio": 2.1770833333333335, "predicted_length": 209, "ground_truth_length": 96 }, { "character_accuracy": 0.11904761904761904, "edit_distance": 37, "normalized_edit_distance": 0.8809523809523809, "word_accuracy": 0.0, "length_ratio": 0.30952380952380953, "predicted_length": 13, "ground_truth_length": 42 }, { "character_accuracy": 0.75, "edit_distance": 11, "normalized_edit_distance": 0.25, "word_accuracy": 0.5, "length_ratio": 0.8409090909090909, "predicted_length": 37, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.3076923076923077, "edit_distance": 18, "normalized_edit_distance": 0.6923076923076923, "word_accuracy": 0.0, "length_ratio": 0.6153846153846154, "predicted_length": 16, "ground_truth_length": 26 }, { "character_accuracy": 0.4375, "edit_distance": 9, "normalized_edit_distance": 0.5625, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8135593220338984, "edit_distance": 11, "normalized_edit_distance": 0.1864406779661017, "word_accuracy": 0.5, "length_ratio": 0.9152542372881356, "predicted_length": 54, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.45454545454545453, "predicted_length": 15, "ground_truth_length": 33 }, { "character_accuracy": 0.4528301886792453, "edit_distance": 29, "normalized_edit_distance": 0.5471698113207547, "word_accuracy": 0.15384615384615385, "length_ratio": 0.7358490566037735, "predicted_length": 39, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 6500, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:38:19.950782", "loss": 0.7189941531419755, "perplexity": 2.052367687225342, "min_loss": 0.3358589708805084, "max_loss": 1.3528335094451904, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.4150271383000453, "avg_word_accuracy": 0.18908734724616405, "avg_edit_distance": 21.03, "avg_normalized_edit_distance": 0.5849728616999549, "avg_length_ratio": 0.7355334487384781, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.8, "edit_distance": 2, "normalized_edit_distance": 0.2, "word_accuracy": 0.3333333333333333, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.6415094339622641, "edit_distance": 19, "normalized_edit_distance": 0.3584905660377358, "word_accuracy": 0.4, "length_ratio": 0.7735849056603774, "predicted_length": 41, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.12790697674418605, "edit_distance": 75, "normalized_edit_distance": 0.872093023255814, "word_accuracy": 0.06666666666666667, "length_ratio": 0.6627906976744186, "predicted_length": 57, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6, "edit_distance": 22, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.5714285714285714, "edit_distance": 3, "normalized_edit_distance": 0.42857142857142855, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.40476190476190477, "edit_distance": 25, "normalized_edit_distance": 0.5952380952380952, "word_accuracy": 0.0, "length_ratio": 0.7619047619047619, "predicted_length": 32, "ground_truth_length": 42 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.6862745098039216, "edit_distance": 16, "normalized_edit_distance": 0.3137254901960784, "word_accuracy": 0.4166666666666667, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.38636363636363635, "edit_distance": 27, "normalized_edit_distance": 0.6136363636363636, "word_accuracy": 0.1111111111111111, "length_ratio": 0.5454545454545454, "predicted_length": 24, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.3090909090909091, "edit_distance": 38, "normalized_edit_distance": 0.6909090909090909, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.4375, "edit_distance": 27, "normalized_edit_distance": 0.5625, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6041666666666666, "predicted_length": 29, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.24324324324324326, "edit_distance": 28, "normalized_edit_distance": 0.7567567567567568, "word_accuracy": 0.0, "length_ratio": 0.6756756756756757, "predicted_length": 25, "ground_truth_length": 37 }, { "character_accuracy": 0.39655172413793105, "edit_distance": 35, "normalized_edit_distance": 0.603448275862069, "word_accuracy": 0.0, "length_ratio": 0.7758620689655172, "predicted_length": 45, "ground_truth_length": 58 }, { "character_accuracy": 0.06818181818181818, "edit_distance": 41, "normalized_edit_distance": 0.9318181818181818, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 10, "ground_truth_length": 44 }, { "character_accuracy": 0.15151515151515152, "edit_distance": 28, "normalized_edit_distance": 0.8484848484848485, "word_accuracy": 0.0, "length_ratio": 0.5454545454545454, "predicted_length": 18, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.717948717948718, "edit_distance": 11, "normalized_edit_distance": 0.28205128205128205, "word_accuracy": 0.2, "length_ratio": 0.9487179487179487, "predicted_length": 37, "ground_truth_length": 39 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.07692307692307693, "length_ratio": 0.6666666666666666, "predicted_length": 28, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8837209302325582, "edit_distance": 10, "normalized_edit_distance": 0.11627906976744186, "word_accuracy": 0.5714285714285714, "length_ratio": 0.9302325581395349, "predicted_length": 80, "ground_truth_length": 86 }, { "character_accuracy": 0.9368421052631579, "edit_distance": 6, "normalized_edit_distance": 0.06315789473684211, "word_accuracy": 0.8666666666666667, "length_ratio": 0.9789473684210527, "predicted_length": 93, "ground_truth_length": 95 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 13, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.3333333333333333, "length_ratio": 0.7435897435897436, "predicted_length": 29, "ground_truth_length": 39 }, { "character_accuracy": 0.9411764705882353, "edit_distance": 4, "normalized_edit_distance": 0.058823529411764705, "word_accuracy": 0.5714285714285714, "length_ratio": 1.0, "predicted_length": 68, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 12, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.2857142857142857, "predicted_length": 4, "ground_truth_length": 14 }, { "character_accuracy": 0.21875, "edit_distance": 25, "normalized_edit_distance": 0.78125, "word_accuracy": 0.0, "length_ratio": 0.78125, "predicted_length": 25, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 42, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.8775510204081632, "predicted_length": 43, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.208, "edit_distance": 99, "normalized_edit_distance": 0.792, "word_accuracy": 0.0, "length_ratio": 1.2755102040816326, "predicted_length": 125, "ground_truth_length": 98 }, { "character_accuracy": 0.6, "edit_distance": 4, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.5975609756097561, "edit_distance": 33, "normalized_edit_distance": 0.4024390243902439, "word_accuracy": 0.29411764705882354, "length_ratio": 0.8536585365853658, "predicted_length": 70, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.18421052631578946, "edit_distance": 31, "normalized_edit_distance": 0.8157894736842105, "word_accuracy": 0.07692307692307693, "length_ratio": 1.7272727272727273, "predicted_length": 38, "ground_truth_length": 22 }, { "character_accuracy": 0.75, "edit_distance": 9, "normalized_edit_distance": 0.25, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8611111111111112, "predicted_length": 31, "ground_truth_length": 36 }, { "character_accuracy": 0.7272727272727273, "edit_distance": 12, "normalized_edit_distance": 0.2727272727272727, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9318181818181818, "predicted_length": 41, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5625, "edit_distance": 28, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.6875, "predicted_length": 44, "ground_truth_length": 64 }, { "character_accuracy": 0.23958333333333334, "edit_distance": 73, "normalized_edit_distance": 0.7604166666666666, "word_accuracy": 0.0, "length_ratio": 1.0105263157894737, "predicted_length": 96, "ground_truth_length": 95 }, { "character_accuracy": 0.1891891891891892, "edit_distance": 30, "normalized_edit_distance": 0.8108108108108109, "word_accuracy": 0.0, "length_ratio": 0.5405405405405406, "predicted_length": 20, "ground_truth_length": 37 }, { "character_accuracy": 0.7586206896551724, "edit_distance": 14, "normalized_edit_distance": 0.2413793103448276, "word_accuracy": 0.09090909090909091, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.4772727272727273, "edit_distance": 23, "normalized_edit_distance": 0.5227272727272727, "word_accuracy": 0.0, "length_ratio": 0.6818181818181818, "predicted_length": 30, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.5882352941176471, "edit_distance": 14, "normalized_edit_distance": 0.4117647058823529, "word_accuracy": 0.42857142857142855, "length_ratio": 0.7647058823529411, "predicted_length": 26, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8148148148148148, "edit_distance": 10, "normalized_edit_distance": 0.18518518518518517, "word_accuracy": 0.26666666666666666, "length_ratio": 0.9814814814814815, "predicted_length": 53, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 3, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.3, "edit_distance": 14, "normalized_edit_distance": 0.7, "word_accuracy": 0.0, "length_ratio": 0.65, "predicted_length": 13, "ground_truth_length": 20 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 160, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 2.216494845360825, "predicted_length": 215, "ground_truth_length": 97 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 8, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 19, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.3181818181818182, "predicted_length": 7, "ground_truth_length": 22 }, { "character_accuracy": 0.26229508196721313, "edit_distance": 45, "normalized_edit_distance": 0.7377049180327869, "word_accuracy": 0.0, "length_ratio": 1.1090909090909091, "predicted_length": 61, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.125, "predicted_length": 1, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.13333333333333333, "edit_distance": 13, "normalized_edit_distance": 0.8666666666666667, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 6, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.7636363636363637, "edit_distance": 13, "normalized_edit_distance": 0.23636363636363636, "word_accuracy": 0.4, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.23214285714285715, "edit_distance": 129, "normalized_edit_distance": 0.7678571428571429, "word_accuracy": 0.0, "length_ratio": 1.5, "predicted_length": 168, "ground_truth_length": 112 }, { "character_accuracy": 0.5625, "edit_distance": 21, "normalized_edit_distance": 0.4375, "word_accuracy": 0.3, "length_ratio": 0.7708333333333334, "predicted_length": 37, "ground_truth_length": 48 }, { "character_accuracy": 0.4375, "edit_distance": 9, "normalized_edit_distance": 0.5625, "word_accuracy": 0.0, "length_ratio": 0.625, "predicted_length": 10, "ground_truth_length": 16 }, { "character_accuracy": 0.8222222222222222, "edit_distance": 8, "normalized_edit_distance": 0.17777777777777778, "word_accuracy": 0.6, "length_ratio": 0.9555555555555556, "predicted_length": 43, "ground_truth_length": 45 }, { "character_accuracy": 0.84, "edit_distance": 8, "normalized_edit_distance": 0.16, "word_accuracy": 0.5555555555555556, "length_ratio": 0.98, "predicted_length": 49, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.5384615384615384, "edit_distance": 42, "normalized_edit_distance": 0.46153846153846156, "word_accuracy": 0.08695652173913043, "length_ratio": 0.9340659340659341, "predicted_length": 85, "ground_truth_length": 91 }, { "character_accuracy": 0.29411764705882354, "edit_distance": 12, "normalized_edit_distance": 0.7058823529411765, "word_accuracy": 0.0, "length_ratio": 0.6470588235294118, "predicted_length": 11, "ground_truth_length": 17 }, { "character_accuracy": 0.275, "edit_distance": 29, "normalized_edit_distance": 0.725, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 20, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 128, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 1.6538461538461537, "predicted_length": 172, "ground_truth_length": 104 }, { "character_accuracy": 0.7604166666666666, "edit_distance": 23, "normalized_edit_distance": 0.23958333333333334, "word_accuracy": 0.5263157894736842, "length_ratio": 0.8333333333333334, "predicted_length": 80, "ground_truth_length": 96 }, { "character_accuracy": 0.8095238095238095, "edit_distance": 8, "normalized_edit_distance": 0.19047619047619047, "word_accuracy": 0.5454545454545454, "length_ratio": 0.9761904761904762, "predicted_length": 41, "ground_truth_length": 42 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.375, "length_ratio": 0.7954545454545454, "predicted_length": 35, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.23076923076923078, "edit_distance": 20, "normalized_edit_distance": 0.7692307692307693, "word_accuracy": 0.0, "length_ratio": 0.5384615384615384, "predicted_length": 14, "ground_truth_length": 26 }, { "character_accuracy": 0.5625, "edit_distance": 7, "normalized_edit_distance": 0.4375, "word_accuracy": 0.0, "length_ratio": 0.75, "predicted_length": 12, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8135593220338984, "edit_distance": 11, "normalized_edit_distance": 0.1864406779661017, "word_accuracy": 0.5, "length_ratio": 0.9152542372881356, "predicted_length": 54, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 27, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.36363636363636365, "predicted_length": 12, "ground_truth_length": 33 }, { "character_accuracy": 0.22641509433962265, "edit_distance": 41, "normalized_edit_distance": 0.7735849056603774, "word_accuracy": 0.4444444444444444, "length_ratio": 0.6226415094339622, "predicted_length": 33, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] }, { "step": 7000, "checkpoint_type": "checkpoint", "timestamp": "2025-08-18T20:39:31.268042", "loss": 0.7223658800125122, "perplexity": 2.0592994689941406, "min_loss": 0.3865942060947418, "max_loss": 1.3336049318313599, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.41553718527220956, "avg_word_accuracy": 0.18711077811077811, "avg_edit_distance": 19.57, "avg_normalized_edit_distance": 0.5844628147277905, "avg_length_ratio": 0.7199628293282676, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3, "predicted_length": 3, "ground_truth_length": 10 }, { "character_accuracy": 0.5094339622641509, "edit_distance": 26, "normalized_edit_distance": 0.49056603773584906, "word_accuracy": 0.15384615384615385, "length_ratio": 0.6981132075471698, "predicted_length": 37, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.2, "edit_distance": 76, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 1.1046511627906976, "predicted_length": 95, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.41818181818181815, "edit_distance": 32, "normalized_edit_distance": 0.5818181818181818, "word_accuracy": 0.0, "length_ratio": 0.6181818181818182, "predicted_length": 34, "ground_truth_length": 55 }, { "character_accuracy": 0.42857142857142855, "edit_distance": 4, "normalized_edit_distance": 0.5714285714285714, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.38095238095238093, "edit_distance": 26, "normalized_edit_distance": 0.6190476190476191, "word_accuracy": 0.0, "length_ratio": 0.6666666666666666, "predicted_length": 28, "ground_truth_length": 42 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.21052631578947367, "edit_distance": 15, "normalized_edit_distance": 0.7894736842105263, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 19, "ground_truth_length": 19 }, { "character_accuracy": 0.17647058823529413, "edit_distance": 14, "normalized_edit_distance": 0.8235294117647058, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7692307692307693, "edit_distance": 9, "normalized_edit_distance": 0.23076923076923078, "word_accuracy": 0.625, "length_ratio": 0.8717948717948718, "predicted_length": 34, "ground_truth_length": 39 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.7142857142857143, "predicted_length": 5, "ground_truth_length": 7 }, { "character_accuracy": 0.7058823529411765, "edit_distance": 15, "normalized_edit_distance": 0.29411764705882354, "word_accuracy": 0.5454545454545454, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.1590909090909091, "edit_distance": 37, "normalized_edit_distance": 0.8409090909090909, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 22, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1, "predicted_length": 1, "ground_truth_length": 10 }, { "character_accuracy": 0.3090909090909091, "edit_distance": 38, "normalized_edit_distance": 0.6909090909090909, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8181818181818182, "predicted_length": 45, "ground_truth_length": 55 }, { "character_accuracy": 0.4375, "edit_distance": 27, "normalized_edit_distance": 0.5625, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6041666666666666, "predicted_length": 29, "ground_truth_length": 48 }, { "character_accuracy": 0.9245283018867925, "edit_distance": 4, "normalized_edit_distance": 0.07547169811320754, "word_accuracy": 0.6666666666666666, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.6216216216216216, "edit_distance": 14, "normalized_edit_distance": 0.3783783783783784, "word_accuracy": 0.25, "length_ratio": 0.8648648648648649, "predicted_length": 32, "ground_truth_length": 37 }, { "character_accuracy": 0.4482758620689655, "edit_distance": 32, "normalized_edit_distance": 0.5517241379310345, "word_accuracy": 0.0, "length_ratio": 0.7758620689655172, "predicted_length": 45, "ground_truth_length": 58 }, { "character_accuracy": 0.4772727272727273, "edit_distance": 23, "normalized_edit_distance": 0.5227272727272727, "word_accuracy": 0.3333333333333333, "length_ratio": 0.6818181818181818, "predicted_length": 30, "ground_truth_length": 44 }, { "character_accuracy": 0.18181818181818182, "edit_distance": 27, "normalized_edit_distance": 0.8181818181818182, "word_accuracy": 0.0, "length_ratio": 0.6060606060606061, "predicted_length": 20, "ground_truth_length": 33 }, { "character_accuracy": 0.8275862068965517, "edit_distance": 10, "normalized_edit_distance": 0.1724137931034483, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9310344827586207, "predicted_length": 54, "ground_truth_length": 58 }, { "character_accuracy": 0.7083333333333334, "edit_distance": 14, "normalized_edit_distance": 0.2916666666666667, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.8205128205128205, "edit_distance": 7, "normalized_edit_distance": 0.1794871794871795, "word_accuracy": 0.2, "length_ratio": 0.9487179487179487, "predicted_length": 37, "ground_truth_length": 39 }, { "character_accuracy": 0.19047619047619047, "edit_distance": 34, "normalized_edit_distance": 0.8095238095238095, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 24, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.7674418604651163, "edit_distance": 20, "normalized_edit_distance": 0.23255813953488372, "word_accuracy": 0.2777777777777778, "length_ratio": 0.9302325581395349, "predicted_length": 80, "ground_truth_length": 86 }, { "character_accuracy": 0.18947368421052632, "edit_distance": 77, "normalized_edit_distance": 0.8105263157894737, "word_accuracy": 0.0, "length_ratio": 0.9368421052631579, "predicted_length": 89, "ground_truth_length": 95 }, { "character_accuracy": 0.2564102564102564, "edit_distance": 29, "normalized_edit_distance": 0.7435897435897436, "word_accuracy": 0.0, "length_ratio": 0.48717948717948717, "predicted_length": 19, "ground_truth_length": 39 }, { "character_accuracy": 0.9264705882352942, "edit_distance": 5, "normalized_edit_distance": 0.07352941176470588, "word_accuracy": 0.6923076923076923, "length_ratio": 0.9852941176470589, "predicted_length": 67, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.21428571428571427, "edit_distance": 11, "normalized_edit_distance": 0.7857142857142857, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 6, "ground_truth_length": 14 }, { "character_accuracy": 0.28125, "edit_distance": 23, "normalized_edit_distance": 0.71875, "word_accuracy": 0.0, "length_ratio": 0.78125, "predicted_length": 25, "ground_truth_length": 32 }, { "character_accuracy": 0.7872340425531915, "edit_distance": 10, "normalized_edit_distance": 0.2127659574468085, "word_accuracy": 0.5, "length_ratio": 0.8723404255319149, "predicted_length": 41, "ground_truth_length": 47 }, { "character_accuracy": 0.8571428571428571, "edit_distance": 7, "normalized_edit_distance": 0.14285714285714285, "word_accuracy": 0.6, "length_ratio": 0.9591836734693877, "predicted_length": 47, "ground_truth_length": 49 }, { "character_accuracy": 0.9263157894736842, "edit_distance": 7, "normalized_edit_distance": 0.07368421052631578, "word_accuracy": 0.7142857142857143, "length_ratio": 0.9578947368421052, "predicted_length": 91, "ground_truth_length": 95 }, { "character_accuracy": 0.20202020202020202, "edit_distance": 79, "normalized_edit_distance": 0.797979797979798, "word_accuracy": 0.0, "length_ratio": 1.010204081632653, "predicted_length": 99, "ground_truth_length": 98 }, { "character_accuracy": 0.6, "edit_distance": 4, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 8, "ground_truth_length": 10 }, { "character_accuracy": 0.8292682926829268, "edit_distance": 14, "normalized_edit_distance": 0.17073170731707318, "word_accuracy": 0.5, "length_ratio": 0.9146341463414634, "predicted_length": 75, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.2, "edit_distance": 32, "normalized_edit_distance": 0.8, "word_accuracy": 0.07692307692307693, "length_ratio": 1.8181818181818181, "predicted_length": 40, "ground_truth_length": 22 }, { "character_accuracy": 0.08333333333333333, "edit_distance": 33, "normalized_edit_distance": 0.9166666666666666, "word_accuracy": 0.0, "length_ratio": 0.2777777777777778, "predicted_length": 10, "ground_truth_length": 36 }, { "character_accuracy": 0.7272727272727273, "edit_distance": 12, "normalized_edit_distance": 0.2727272727272727, "word_accuracy": 0.2727272727272727, "length_ratio": 0.9318181818181818, "predicted_length": 41, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.21875, "edit_distance": 50, "normalized_edit_distance": 0.78125, "word_accuracy": 0.0, "length_ratio": 0.859375, "predicted_length": 55, "ground_truth_length": 64 }, { "character_accuracy": 0.31666666666666665, "edit_distance": 82, "normalized_edit_distance": 0.6833333333333333, "word_accuracy": 0.0, "length_ratio": 1.263157894736842, "predicted_length": 120, "ground_truth_length": 95 }, { "character_accuracy": 0.9210526315789473, "edit_distance": 3, "normalized_edit_distance": 0.07894736842105263, "word_accuracy": 0.5714285714285714, "length_ratio": 1.027027027027027, "predicted_length": 38, "ground_truth_length": 37 }, { "character_accuracy": 0.7931034482758621, "edit_distance": 12, "normalized_edit_distance": 0.20689655172413793, "word_accuracy": 0.09090909090909091, "length_ratio": 0.9482758620689655, "predicted_length": 55, "ground_truth_length": 58 }, { "character_accuracy": 0.4090909090909091, "edit_distance": 26, "normalized_edit_distance": 0.5909090909090909, "word_accuracy": 0.0, "length_ratio": 0.6590909090909091, "predicted_length": 29, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.76, "edit_distance": 12, "normalized_edit_distance": 0.24, "word_accuracy": 0.6, "length_ratio": 0.86, "predicted_length": 43, "ground_truth_length": 50 }, { "character_accuracy": 0.5588235294117647, "edit_distance": 15, "normalized_edit_distance": 0.4411764705882353, "word_accuracy": 0.2222222222222222, "length_ratio": 0.8823529411764706, "predicted_length": 30, "ground_truth_length": 34 }, { "character_accuracy": 0.8666666666666667, "edit_distance": 8, "normalized_edit_distance": 0.13333333333333333, "word_accuracy": 0.6153846153846154, "length_ratio": 0.95, "predicted_length": 57, "ground_truth_length": 60 }, { "character_accuracy": 0.8148148148148148, "edit_distance": 10, "normalized_edit_distance": 0.18518518518518517, "word_accuracy": 0.38461538461538464, "length_ratio": 0.9444444444444444, "predicted_length": 51, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.4, "edit_distance": 12, "normalized_edit_distance": 0.6, "word_accuracy": 0.0, "length_ratio": 0.65, "predicted_length": 13, "ground_truth_length": 20 }, { "character_accuracy": 0.2558139534883721, "edit_distance": 160, "normalized_edit_distance": 0.7441860465116279, "word_accuracy": 0.0, "length_ratio": 2.216494845360825, "predicted_length": 215, "ground_truth_length": 97 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 8, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.7272727272727273, "predicted_length": 8, "ground_truth_length": 11 }, { "character_accuracy": 0.2621359223300971, "edit_distance": 76, "normalized_edit_distance": 0.7378640776699029, "word_accuracy": 0.34615384615384615, "length_ratio": 1.0618556701030928, "predicted_length": 103, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 22, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 5, "ground_truth_length": 22 }, { "character_accuracy": 0.7636363636363637, "edit_distance": 13, "normalized_edit_distance": 0.23636363636363636, "word_accuracy": 0.4166666666666667, "length_ratio": 0.8363636363636363, "predicted_length": 46, "ground_truth_length": 55 }, { "character_accuracy": 0.25, "edit_distance": 6, "normalized_edit_distance": 0.75, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.16666666666666666, "predicted_length": 1, "ground_truth_length": 6 }, { "character_accuracy": 0.13333333333333333, "edit_distance": 13, "normalized_edit_distance": 0.8666666666666667, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 6, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.6727272727272727, "edit_distance": 18, "normalized_edit_distance": 0.32727272727272727, "word_accuracy": 0.18181818181818182, "length_ratio": 0.7818181818181819, "predicted_length": 43, "ground_truth_length": 55 }, { "character_accuracy": 0.6, "edit_distance": 2, "normalized_edit_distance": 0.4, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.3125, "edit_distance": 77, "normalized_edit_distance": 0.6875, "word_accuracy": 0.041666666666666664, "length_ratio": 0.8125, "predicted_length": 91, "ground_truth_length": 112 }, { "character_accuracy": 0.6666666666666666, "edit_distance": 16, "normalized_edit_distance": 0.3333333333333333, "word_accuracy": 0.4444444444444444, "length_ratio": 0.7708333333333334, "predicted_length": 37, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 8, "ground_truth_length": 16 }, { "character_accuracy": 0.8, "edit_distance": 9, "normalized_edit_distance": 0.2, "word_accuracy": 0.5, "length_ratio": 0.9333333333333333, "predicted_length": 42, "ground_truth_length": 45 }, { "character_accuracy": 0.86, "edit_distance": 7, "normalized_edit_distance": 0.14, "word_accuracy": 0.5555555555555556, "length_ratio": 0.98, "predicted_length": 49, "ground_truth_length": 50 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.42857142857142855, "predicted_length": 3, "ground_truth_length": 7 }, { "character_accuracy": 0.648936170212766, "edit_distance": 33, "normalized_edit_distance": 0.35106382978723405, "word_accuracy": 0.3, "length_ratio": 1.032967032967033, "predicted_length": 94, "ground_truth_length": 91 }, { "character_accuracy": 0.29411764705882354, "edit_distance": 12, "normalized_edit_distance": 0.7058823529411765, "word_accuracy": 0.0, "length_ratio": 0.6470588235294118, "predicted_length": 11, "ground_truth_length": 17 }, { "character_accuracy": 0.55, "edit_distance": 18, "normalized_edit_distance": 0.45, "word_accuracy": 0.25, "length_ratio": 0.6, "predicted_length": 24, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 3, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 1, "ground_truth_length": 3 }, { "character_accuracy": 0.7403846153846154, "edit_distance": 27, "normalized_edit_distance": 0.25961538461538464, "word_accuracy": 0.5238095238095238, "length_ratio": 0.8076923076923077, "predicted_length": 84, "ground_truth_length": 104 }, { "character_accuracy": 0.7604166666666666, "edit_distance": 23, "normalized_edit_distance": 0.23958333333333334, "word_accuracy": 0.45, "length_ratio": 0.8541666666666666, "predicted_length": 82, "ground_truth_length": 96 }, { "character_accuracy": 0.8095238095238095, "edit_distance": 8, "normalized_edit_distance": 0.19047619047619047, "word_accuracy": 0.5454545454545454, "length_ratio": 0.9761904761904762, "predicted_length": 41, "ground_truth_length": 42 }, { "character_accuracy": 0.7045454545454546, "edit_distance": 13, "normalized_edit_distance": 0.29545454545454547, "word_accuracy": 0.375, "length_ratio": 0.7954545454545454, "predicted_length": 35, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 3, "ground_truth_length": 5 }, { "character_accuracy": 0.23076923076923078, "edit_distance": 20, "normalized_edit_distance": 0.7692307692307693, "word_accuracy": 0.0, "length_ratio": 0.5384615384615384, "predicted_length": 14, "ground_truth_length": 26 }, { "character_accuracy": 0.4375, "edit_distance": 9, "normalized_edit_distance": 0.5625, "word_accuracy": 0.0, "length_ratio": 0.625, "predicted_length": 10, "ground_truth_length": 16 }, { "character_accuracy": 0.7666666666666667, "edit_distance": 14, "normalized_edit_distance": 0.23333333333333334, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.8135593220338984, "edit_distance": 11, "normalized_edit_distance": 0.1864406779661017, "word_accuracy": 0.5, "length_ratio": 0.9152542372881356, "predicted_length": 54, "ground_truth_length": 59 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.2727272727272727, "edit_distance": 24, "normalized_edit_distance": 0.7272727272727273, "word_accuracy": 0.0, "length_ratio": 0.48484848484848486, "predicted_length": 16, "ground_truth_length": 33 }, { "character_accuracy": 0.22641509433962265, "edit_distance": 41, "normalized_edit_distance": 0.7735849056603774, "word_accuracy": 0.0, "length_ratio": 0.37735849056603776, "predicted_length": 20, "ground_truth_length": 53 }, { "character_accuracy": 0.819672131147541, "edit_distance": 11, "normalized_edit_distance": 0.18032786885245902, "word_accuracy": 0.45454545454545453, "length_ratio": 0.9016393442622951, "predicted_length": 55, "ground_truth_length": 61 } ] } ], "training_config": { "dataset_name": "CATMuS/medieval", "model_name": "LiquidAI/LFM2-VL-450M", "max_steps": 10000, "eval_steps": 500, "num_accumulation_steps": 1, "learning_rate": 1e-05, "train_batch_size": 2, "val_batch_size": 2, "train_select_start": 0, "train_select_end": 148000, "val_select_start": 148001, "val_select_end": 150000, "train_field": "train", "val_field": "train", "image_column": "im", "text_column": "text", "user_text": "Transcribe this medieval manuscript line.", "max_image_size": 200 }, "pre_training_eval": { "loss": 1.2974295389652253, "perplexity": 3.659877061843872, "min_loss": 0.9512767791748047, "max_loss": 1.703115463256836, "num_samples": 100, "num_batches": 50, "avg_char_accuracy": 0.27680277119292407, "avg_word_accuracy": 0.11646049990689945, "avg_edit_distance": 33.17, "avg_normalized_edit_distance": 0.7231972288070756, "avg_length_ratio": 0.9951391574082407, "text_samples_evaluated": 100, "detailed_text_metrics": [ { "character_accuracy": 0.9069767441860465, "edit_distance": 4, "normalized_edit_distance": 0.09302325581395349, "word_accuracy": 0.5, "length_ratio": 1.0, "predicted_length": 43, "ground_truth_length": 43 }, { "character_accuracy": 0.034482758620689655, "edit_distance": 28, "normalized_edit_distance": 0.9655172413793104, "word_accuracy": 0.0, "length_ratio": 2.9, "predicted_length": 29, "ground_truth_length": 10 }, { "character_accuracy": 0.6226415094339622, "edit_distance": 20, "normalized_edit_distance": 0.37735849056603776, "word_accuracy": 0.25, "length_ratio": 0.7358490566037735, "predicted_length": 39, "ground_truth_length": 53 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 2, "ground_truth_length": 5 }, { "character_accuracy": 0.2803030303030303, "edit_distance": 95, "normalized_edit_distance": 0.7196969696969697, "word_accuracy": 0.13793103448275862, "length_ratio": 1.5348837209302326, "predicted_length": 132, "ground_truth_length": 86 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.34375, "edit_distance": 42, "normalized_edit_distance": 0.65625, "word_accuracy": 0.0, "length_ratio": 1.1636363636363636, "predicted_length": 64, "ground_truth_length": 55 }, { "character_accuracy": 0.16666666666666666, "edit_distance": 15, "normalized_edit_distance": 0.8333333333333334, "word_accuracy": 0.0, "length_ratio": 2.5714285714285716, "predicted_length": 18, "ground_truth_length": 7 }, { "character_accuracy": 0.11904761904761904, "edit_distance": 37, "normalized_edit_distance": 0.8809523809523809, "word_accuracy": 0.0, "length_ratio": 0.6190476190476191, "predicted_length": 26, "ground_truth_length": 42 }, { "character_accuracy": 0.8, "edit_distance": 1, "normalized_edit_distance": 0.2, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 19, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3684210526315789, "predicted_length": 7, "ground_truth_length": 19 }, { "character_accuracy": 0.058823529411764705, "edit_distance": 16, "normalized_edit_distance": 0.9411764705882353, "word_accuracy": 0.0, "length_ratio": 0.47058823529411764, "predicted_length": 8, "ground_truth_length": 17 }, { "character_accuracy": 0.7435897435897436, "edit_distance": 10, "normalized_edit_distance": 0.2564102564102564, "word_accuracy": 0.4444444444444444, "length_ratio": 0.8461538461538461, "predicted_length": 33, "ground_truth_length": 39 }, { "character_accuracy": 0.14285714285714285, "edit_distance": 6, "normalized_edit_distance": 0.8571428571428571, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 18, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.4166666666666667, "length_ratio": 0.7843137254901961, "predicted_length": 40, "ground_truth_length": 51 }, { "character_accuracy": 0.29545454545454547, "edit_distance": 31, "normalized_edit_distance": 0.7045454545454546, "word_accuracy": 0.1111111111111111, "length_ratio": 0.7045454545454546, "predicted_length": 31, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 55, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.18181818181818182, "predicted_length": 10, "ground_truth_length": 55 }, { "character_accuracy": 0.265625, "edit_distance": 47, "normalized_edit_distance": 0.734375, "word_accuracy": 0.0, "length_ratio": 1.3333333333333333, "predicted_length": 64, "ground_truth_length": 48 }, { "character_accuracy": 0.8867924528301887, "edit_distance": 6, "normalized_edit_distance": 0.11320754716981132, "word_accuracy": 0.5384615384615384, "length_ratio": 1.0, "predicted_length": 53, "ground_truth_length": 53 }, { "character_accuracy": 0.5405405405405406, "edit_distance": 17, "normalized_edit_distance": 0.4594594594594595, "word_accuracy": 0.2857142857142857, "length_ratio": 0.7027027027027027, "predicted_length": 26, "ground_truth_length": 37 }, { "character_accuracy": 0.0, "edit_distance": 58, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.1896551724137931, "predicted_length": 11, "ground_truth_length": 58 }, { "character_accuracy": 0.045454545454545456, "edit_distance": 42, "normalized_edit_distance": 0.9545454545454546, "word_accuracy": 0.0, "length_ratio": 0.20454545454545456, "predicted_length": 9, "ground_truth_length": 44 }, { "character_accuracy": 0.030303030303030304, "edit_distance": 32, "normalized_edit_distance": 0.9696969696969697, "word_accuracy": 0.0, "length_ratio": 0.30303030303030304, "predicted_length": 10, "ground_truth_length": 33 }, { "character_accuracy": 0.20689655172413793, "edit_distance": 46, "normalized_edit_distance": 0.7931034482758621, "word_accuracy": 0.0, "length_ratio": 0.9137931034482759, "predicted_length": 53, "ground_truth_length": 58 }, { "character_accuracy": 0.75, "edit_distance": 12, "normalized_edit_distance": 0.25, "word_accuracy": 0.42857142857142855, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.5384615384615384, "edit_distance": 18, "normalized_edit_distance": 0.46153846153846156, "word_accuracy": 0.1111111111111111, "length_ratio": 0.717948717948718, "predicted_length": 28, "ground_truth_length": 39 }, { "character_accuracy": 0.23809523809523808, "edit_distance": 32, "normalized_edit_distance": 0.7619047619047619, "word_accuracy": 0.0, "length_ratio": 0.8095238095238095, "predicted_length": 34, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.872093023255814, "edit_distance": 11, "normalized_edit_distance": 0.12790697674418605, "word_accuracy": 0.6428571428571429, "length_ratio": 0.9418604651162791, "predicted_length": 81, "ground_truth_length": 86 }, { "character_accuracy": 0.7789473684210526, "edit_distance": 21, "normalized_edit_distance": 0.22105263157894736, "word_accuracy": 0.7333333333333333, "length_ratio": 0.8315789473684211, "predicted_length": 79, "ground_truth_length": 95 }, { "character_accuracy": 0.8974358974358975, "edit_distance": 4, "normalized_edit_distance": 0.10256410256410256, "word_accuracy": 0.75, "length_ratio": 0.8974358974358975, "predicted_length": 35, "ground_truth_length": 39 }, { "character_accuracy": 0.26804123711340205, "edit_distance": 71, "normalized_edit_distance": 0.7319587628865979, "word_accuracy": 0.0, "length_ratio": 1.4264705882352942, "predicted_length": 97, "ground_truth_length": 68 }, { "character_accuracy": 0.0, "edit_distance": 2, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 1, "ground_truth_length": 2 }, { "character_accuracy": 0.0, "edit_distance": 14, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.21428571428571427, "predicted_length": 3, "ground_truth_length": 14 }, { "character_accuracy": 0.1702127659574468, "edit_distance": 39, "normalized_edit_distance": 0.8297872340425532, "word_accuracy": 0.0, "length_ratio": 1.46875, "predicted_length": 47, "ground_truth_length": 32 }, { "character_accuracy": 0.1702127659574468, "edit_distance": 39, "normalized_edit_distance": 0.8297872340425532, "word_accuracy": 0.0, "length_ratio": 0.8297872340425532, "predicted_length": 39, "ground_truth_length": 47 }, { "character_accuracy": 0.234375, "edit_distance": 49, "normalized_edit_distance": 0.765625, "word_accuracy": 0.058823529411764705, "length_ratio": 1.3061224489795917, "predicted_length": 64, "ground_truth_length": 49 }, { "character_accuracy": 0.20967741935483872, "edit_distance": 147, "normalized_edit_distance": 0.7903225806451613, "word_accuracy": 0.0, "length_ratio": 1.9578947368421054, "predicted_length": 186, "ground_truth_length": 95 }, { "character_accuracy": 0.20207253886010362, "edit_distance": 154, "normalized_edit_distance": 0.7979274611398963, "word_accuracy": 0.0, "length_ratio": 1.969387755102041, "predicted_length": 193, "ground_truth_length": 98 }, { "character_accuracy": 0.1, "edit_distance": 9, "normalized_edit_distance": 0.9, "word_accuracy": 0.0, "length_ratio": 0.6, "predicted_length": 6, "ground_truth_length": 10 }, { "character_accuracy": 0.4024390243902439, "edit_distance": 49, "normalized_edit_distance": 0.5975609756097561, "word_accuracy": 0.0625, "length_ratio": 0.9634146341463414, "predicted_length": 79, "ground_truth_length": 82 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 2, "ground_truth_length": 10 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.1956521739130435, "edit_distance": 37, "normalized_edit_distance": 0.8043478260869565, "word_accuracy": 0.0, "length_ratio": 2.090909090909091, "predicted_length": 46, "ground_truth_length": 22 }, { "character_accuracy": 0.19444444444444445, "edit_distance": 29, "normalized_edit_distance": 0.8055555555555556, "word_accuracy": 0.0, "length_ratio": 0.4722222222222222, "predicted_length": 17, "ground_truth_length": 36 }, { "character_accuracy": 0.7954545454545454, "edit_distance": 9, "normalized_edit_distance": 0.20454545454545456, "word_accuracy": 0.5555555555555556, "length_ratio": 0.9090909090909091, "predicted_length": 40, "ground_truth_length": 44 }, { "character_accuracy": 0.7708333333333334, "edit_distance": 11, "normalized_edit_distance": 0.22916666666666666, "word_accuracy": 0.625, "length_ratio": 0.8541666666666666, "predicted_length": 41, "ground_truth_length": 48 }, { "character_accuracy": 0.4375, "edit_distance": 36, "normalized_edit_distance": 0.5625, "word_accuracy": 0.0, "length_ratio": 0.96875, "predicted_length": 62, "ground_truth_length": 64 }, { "character_accuracy": 0.23469387755102042, "edit_distance": 150, "normalized_edit_distance": 0.7653061224489796, "word_accuracy": 0.0, "length_ratio": 2.0631578947368423, "predicted_length": 196, "ground_truth_length": 95 }, { "character_accuracy": 0.2972972972972973, "edit_distance": 26, "normalized_edit_distance": 0.7027027027027027, "word_accuracy": 0.125, "length_ratio": 0.6216216216216216, "predicted_length": 23, "ground_truth_length": 37 }, { "character_accuracy": 0.13793103448275862, "edit_distance": 50, "normalized_edit_distance": 0.8620689655172413, "word_accuracy": 0.0, "length_ratio": 0.9655172413793104, "predicted_length": 56, "ground_truth_length": 58 }, { "character_accuracy": 0.13636363636363635, "edit_distance": 38, "normalized_edit_distance": 0.8636363636363636, "word_accuracy": 0.0, "length_ratio": 0.5681818181818182, "predicted_length": 25, "ground_truth_length": 44 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.72, "edit_distance": 14, "normalized_edit_distance": 0.28, "word_accuracy": 0.6, "length_ratio": 0.84, "predicted_length": 42, "ground_truth_length": 50 }, { "character_accuracy": 0.6470588235294118, "edit_distance": 12, "normalized_edit_distance": 0.35294117647058826, "word_accuracy": 0.2857142857142857, "length_ratio": 0.7941176470588235, "predicted_length": 27, "ground_truth_length": 34 }, { "character_accuracy": 0.0, "edit_distance": 60, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.23333333333333334, "predicted_length": 14, "ground_truth_length": 60 }, { "character_accuracy": 0.23076923076923078, "edit_distance": 70, "normalized_edit_distance": 0.7692307692307693, "word_accuracy": 0.0, "length_ratio": 1.6851851851851851, "predicted_length": 91, "ground_truth_length": 54 }, { "character_accuracy": 0.0, "edit_distance": 13, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 2.6, "predicted_length": 13, "ground_truth_length": 5 }, { "character_accuracy": 0.3333333333333333, "edit_distance": 4, "normalized_edit_distance": 0.6666666666666666, "word_accuracy": 0.0, "length_ratio": 0.3333333333333333, "predicted_length": 2, "ground_truth_length": 6 }, { "character_accuracy": 0.8888888888888888, "edit_distance": 5, "normalized_edit_distance": 0.1111111111111111, "word_accuracy": 0.6666666666666666, "length_ratio": 0.9777777777777777, "predicted_length": 44, "ground_truth_length": 45 }, { "character_accuracy": 0.0, "edit_distance": 20, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 4, "ground_truth_length": 20 }, { "character_accuracy": 0.2561576354679803, "edit_distance": 151, "normalized_edit_distance": 0.7438423645320197, "word_accuracy": 0.0, "length_ratio": 2.0927835051546393, "predicted_length": 203, "ground_truth_length": 97 }, { "character_accuracy": 0.12244897959183673, "edit_distance": 43, "normalized_edit_distance": 0.8775510204081632, "word_accuracy": 0.0, "length_ratio": 4.454545454545454, "predicted_length": 49, "ground_truth_length": 11 }, { "character_accuracy": 0.25961538461538464, "edit_distance": 77, "normalized_edit_distance": 0.7403846153846154, "word_accuracy": 0.36, "length_ratio": 1.0721649484536082, "predicted_length": 104, "ground_truth_length": 97 }, { "character_accuracy": 0.0, "edit_distance": 7, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.1891891891891892, "edit_distance": 30, "normalized_edit_distance": 0.8108108108108109, "word_accuracy": 0.0, "length_ratio": 1.6818181818181819, "predicted_length": 37, "ground_truth_length": 22 }, { "character_accuracy": 0.0, "edit_distance": 55, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.23636363636363636, "predicted_length": 13, "ground_truth_length": 55 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.5, "predicted_length": 4, "ground_truth_length": 8 }, { "character_accuracy": 0.625, "edit_distance": 3, "normalized_edit_distance": 0.375, "word_accuracy": 0.0, "length_ratio": 1.1428571428571428, "predicted_length": 8, "ground_truth_length": 7 }, { "character_accuracy": 0.0, "edit_distance": 6, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.0, "predicted_length": 6, "ground_truth_length": 6 }, { "character_accuracy": 0.26666666666666666, "edit_distance": 11, "normalized_edit_distance": 0.7333333333333333, "word_accuracy": 0.0, "length_ratio": 0.5333333333333333, "predicted_length": 8, "ground_truth_length": 15 }, { "character_accuracy": 0.0, "edit_distance": 8, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.25, "predicted_length": 2, "ground_truth_length": 8 }, { "character_accuracy": 0.0, "edit_distance": 55, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2909090909090909, "predicted_length": 16, "ground_truth_length": 55 }, { "character_accuracy": 0.03125, "edit_distance": 31, "normalized_edit_distance": 0.96875, "word_accuracy": 0.0, "length_ratio": 6.4, "predicted_length": 32, "ground_truth_length": 5 }, { "character_accuracy": 0.625, "edit_distance": 42, "normalized_edit_distance": 0.375, "word_accuracy": 0.5454545454545454, "length_ratio": 0.6607142857142857, "predicted_length": 74, "ground_truth_length": 112 }, { "character_accuracy": 0.11538461538461539, "edit_distance": 46, "normalized_edit_distance": 0.8846153846153846, "word_accuracy": 0.0, "length_ratio": 1.0833333333333333, "predicted_length": 52, "ground_truth_length": 48 }, { "character_accuracy": 0.125, "edit_distance": 14, "normalized_edit_distance": 0.875, "word_accuracy": 0.0, "length_ratio": 0.5625, "predicted_length": 9, "ground_truth_length": 16 }, { "character_accuracy": 0.2602739726027397, "edit_distance": 54, "normalized_edit_distance": 0.7397260273972602, "word_accuracy": 0.0, "length_ratio": 1.6222222222222222, "predicted_length": 73, "ground_truth_length": 45 }, { "character_accuracy": 0.24444444444444444, "edit_distance": 68, "normalized_edit_distance": 0.7555555555555555, "word_accuracy": 0.0, "length_ratio": 1.8, "predicted_length": 90, "ground_truth_length": 50 }, { "character_accuracy": 0.2857142857142857, "edit_distance": 5, "normalized_edit_distance": 0.7142857142857143, "word_accuracy": 0.0, "length_ratio": 0.5714285714285714, "predicted_length": 4, "ground_truth_length": 7 }, { "character_accuracy": 0.22123893805309736, "edit_distance": 88, "normalized_edit_distance": 0.7787610619469026, "word_accuracy": 0.0, "length_ratio": 1.2417582417582418, "predicted_length": 113, "ground_truth_length": 91 }, { "character_accuracy": 0.1724137931034483, "edit_distance": 24, "normalized_edit_distance": 0.8275862068965517, "word_accuracy": 0.0, "length_ratio": 1.7058823529411764, "predicted_length": 29, "ground_truth_length": 17 }, { "character_accuracy": 0.65, "edit_distance": 14, "normalized_edit_distance": 0.35, "word_accuracy": 0.5714285714285714, "length_ratio": 0.675, "predicted_length": 27, "ground_truth_length": 40 }, { "character_accuracy": 0.0, "edit_distance": 5, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.2, "predicted_length": 1, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 4, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 1.3333333333333333, "predicted_length": 4, "ground_truth_length": 3 }, { "character_accuracy": 0.2346368715083799, "edit_distance": 137, "normalized_edit_distance": 0.7653631284916201, "word_accuracy": 0.0, "length_ratio": 1.7211538461538463, "predicted_length": 179, "ground_truth_length": 104 }, { "character_accuracy": 0.22839506172839505, "edit_distance": 125, "normalized_edit_distance": 0.7716049382716049, "word_accuracy": 0.0, "length_ratio": 1.6875, "predicted_length": 162, "ground_truth_length": 96 }, { "character_accuracy": 0.47619047619047616, "edit_distance": 22, "normalized_edit_distance": 0.5238095238095238, "word_accuracy": 0.15384615384615385, "length_ratio": 0.9285714285714286, "predicted_length": 39, "ground_truth_length": 42 }, { "character_accuracy": 0.0, "edit_distance": 44, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.22727272727272727, "predicted_length": 10, "ground_truth_length": 44 }, { "character_accuracy": 0.2, "edit_distance": 4, "normalized_edit_distance": 0.8, "word_accuracy": 0.0, "length_ratio": 0.8, "predicted_length": 4, "ground_truth_length": 5 }, { "character_accuracy": 0.0, "edit_distance": 26, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.3076923076923077, "predicted_length": 8, "ground_truth_length": 26 }, { "character_accuracy": 0.16, "edit_distance": 21, "normalized_edit_distance": 0.84, "word_accuracy": 0.0, "length_ratio": 1.5625, "predicted_length": 25, "ground_truth_length": 16 }, { "character_accuracy": 0.75, "edit_distance": 15, "normalized_edit_distance": 0.25, "word_accuracy": 0.6666666666666666, "length_ratio": 0.8333333333333334, "predicted_length": 50, "ground_truth_length": 60 }, { "character_accuracy": 0.6440677966101694, "edit_distance": 21, "normalized_edit_distance": 0.3559322033898305, "word_accuracy": 0.36363636363636365, "length_ratio": 0.6949152542372882, "predicted_length": 41, "ground_truth_length": 59 }, { "character_accuracy": 0.0, "edit_distance": 10, "normalized_edit_distance": 1.0, "word_accuracy": 0.0, "length_ratio": 0.4, "predicted_length": 4, "ground_truth_length": 10 }, { "character_accuracy": 0.24242424242424243, "edit_distance": 25, "normalized_edit_distance": 0.7575757575757576, "word_accuracy": 0.0, "length_ratio": 0.5151515151515151, "predicted_length": 17, "ground_truth_length": 33 }, { "character_accuracy": 0.23636363636363636, "edit_distance": 42, "normalized_edit_distance": 0.7636363636363637, "word_accuracy": 0.05555555555555555, "length_ratio": 1.0377358490566038, "predicted_length": 55, "ground_truth_length": 53 }, { "character_accuracy": 0.8688524590163934, "edit_distance": 8, "normalized_edit_distance": 0.13114754098360656, "word_accuracy": 0.6, "length_ratio": 0.9672131147540983, "predicted_length": 59, "ground_truth_length": 61 } ] }, "post_training_eval": null, "base_model": "LiquidAI/LFM2-VL-450M", "generated_at": "2025-08-18T20:39:32.807423" }