robiulawaldev committed on
Commit
a56fc4d
·
verified ·
1 Parent(s): d0f450f

Training in progress, step 12, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:749512039905e54b4fda9b285bfa58998f095aabc18773c9ece09be87caff2a0
3
  size 20312676
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc542b89b2fb409ffa2a15b109a533053ba9987b3cb65f997a66fde03c3ca98f
3
  size 20312676
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6089a8858f8deb2de47fb0521be50994912c13387776ea61d86b7928ecdc7e3
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d93b8ffb6cde37ebd1d1f1709c31c7b1e2378a4fc738f0c955225ffcdfe0b8dc
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d7b358298aa83a40c1b56e5c320426fa83976856684a928a0b4adb7fc547539
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c3f3d5c4a86eb24d6104ecbafd33bca7426420d96c84e1b2c30df274293a5af
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.64,
5
  "eval_steps": 4,
6
- "global_step": 8,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -31,6 +31,21 @@
31
  "eval_samples_per_second": 70.793,
32
  "eval_steps_per_second": 23.598,
33
  "step": 8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  }
35
  ],
36
  "logging_steps": 10,
@@ -50,7 +65,7 @@
50
  "attributes": {}
51
  }
52
  },
53
- "total_flos": 22801104764928.0,
54
  "train_batch_size": 4,
55
  "trial_name": null,
56
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.96,
5
  "eval_steps": 4,
6
+ "global_step": 12,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
31
  "eval_samples_per_second": 70.793,
32
  "eval_steps_per_second": 23.598,
33
  "step": 8
34
+ },
35
+ {
36
+ "epoch": 0.8,
37
+ "grad_norm": NaN,
38
+ "learning_rate": 0.0002,
39
+ "loss": 0.0,
40
+ "step": 10
41
+ },
42
+ {
43
+ "epoch": 0.96,
44
+ "eval_loss": NaN,
45
+ "eval_runtime": 0.0834,
46
+ "eval_samples_per_second": 71.935,
47
+ "eval_steps_per_second": 23.978,
48
+ "step": 12
49
  }
50
  ],
51
  "logging_steps": 10,
 
65
  "attributes": {}
66
  }
67
  },
68
+ "total_flos": 34201657147392.0,
69
  "train_batch_size": 4,
70
  "trial_name": null,
71
  "trial_params": null