| { | |
| "best_epoch": 2, | |
| "best_loss": 0.07834781419772369, | |
| "best_checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000002.safetensors", | |
| "total_epochs": 24, | |
| "all_losses": [ | |
| { | |
| "epoch": 1, | |
| "loss": 0.0983309017924162, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000001.safetensors", | |
| "global_step": 13 | |
| }, | |
| { | |
| "epoch": 2, | |
| "loss": 0.07834781419772369, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000002.safetensors", | |
| "global_step": 26 | |
| }, | |
| { | |
| "epoch": 3, | |
| "loss": 0.1946192876650737, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000003.safetensors", | |
| "global_step": 39 | |
| }, | |
| { | |
| "epoch": 4, | |
| "loss": 3.9677493205437293, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000004.safetensors", | |
| "global_step": 52 | |
| }, | |
| { | |
| "epoch": 5, | |
| "loss": 0.7346479594707489, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000005.safetensors", | |
| "global_step": 65 | |
| }, | |
| { | |
| "epoch": 6, | |
| "loss": 0.7469201248425704, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000006.safetensors", | |
| "global_step": 78 | |
| }, | |
| { | |
| "epoch": 7, | |
| "loss": 0.700389550282405, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000007.safetensors", | |
| "global_step": 91 | |
| }, | |
| { | |
| "epoch": 8, | |
| "loss": 0.7346234115270468, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000008.safetensors", | |
| "global_step": 104 | |
| }, | |
| { | |
| "epoch": 9, | |
| "loss": 0.7212961820455698, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000009.safetensors", | |
| "global_step": 117 | |
| }, | |
| { | |
| "epoch": 10, | |
| "loss": 0.6475075506247007, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000010.safetensors", | |
| "global_step": 130 | |
| }, | |
| { | |
| "epoch": 11, | |
| "loss": 0.6152113057099856, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000011.safetensors", | |
| "global_step": 143 | |
| }, | |
| { | |
| "epoch": 12, | |
| "loss": 0.7991792032351861, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000012.safetensors", | |
| "global_step": 156 | |
| }, | |
| { | |
| "epoch": 13, | |
| "loss": 0.6762913018465042, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000013.safetensors", | |
| "global_step": 169 | |
| }, | |
| { | |
| "epoch": 14, | |
| "loss": 0.7254251264608823, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000014.safetensors", | |
| "global_step": 182 | |
| }, | |
| { | |
| "epoch": 15, | |
| "loss": 0.708387180016591, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000015.safetensors", | |
| "global_step": 195 | |
| }, | |
| { | |
| "epoch": 16, | |
| "loss": 0.6945093090717609, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000016.safetensors", | |
| "global_step": 208 | |
| }, | |
| { | |
| "epoch": 17, | |
| "loss": 0.7329169397170727, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000017.safetensors", | |
| "global_step": 221 | |
| }, | |
| { | |
| "epoch": 18, | |
| "loss": 0.7032873630523682, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000018.safetensors", | |
| "global_step": 234 | |
| }, | |
| { | |
| "epoch": 19, | |
| "loss": 0.8162262852375324, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000019.safetensors", | |
| "global_step": 247 | |
| }, | |
| { | |
| "epoch": 20, | |
| "loss": 0.7767565181622138, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000020.safetensors", | |
| "global_step": 260 | |
| }, | |
| { | |
| "epoch": 21, | |
| "loss": 0.6119314363369575, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000021.safetensors", | |
| "global_step": 273 | |
| }, | |
| { | |
| "epoch": 22, | |
| "loss": 0.7206398065273578, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000022.safetensors", | |
| "global_step": 286 | |
| }, | |
| { | |
| "epoch": 23, | |
| "loss": 0.6361816445222268, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000023.safetensors", | |
| "global_step": 299 | |
| }, | |
| { | |
| "epoch": 24, | |
| "loss": 0.8124457013148528, | |
| "checkpoint": "/app/checkpoints/3c7f6249-80ac-4a5b-b06f-6ae456b30edc/3c7f6249-80ac-4a5b-b06f-6ae456bsuai3/last-000024.safetensors", | |
| "global_step": 312 | |
| } | |
| ] | |
| } |