flytech commited on
Commit
2cc573a
1 Parent(s): 898781a

Training in progress, step 1900, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb2949c288c43991698176ffbd5aa30aed17f67428acf5a2ec2d8b5e97b044e
3
  size 160285149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af6d42d568c10c05bd0a235b35138ad5ac51f2a52cb724441cd7bfb5e2d9653f
3
  size 160285149
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d780045b7ba04666ddb94197b3702ccc98c54e1ba36cf994425e87905fd032e
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b5c2cb2dfb3f60750713c8e1a124a5bce3de66d8a6642dd7a6723300b51429a
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be50d991d0ad05925161d2b4ecb2ad706ca272d5d5a04ebcad5d79266d1efcea
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:504ae0bcaabd05c86ca42a16a90534b6c93ee4e2544d2c7bdfb57fa3e94a82bc
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.6666666666666665,
5
  "eval_steps": 100,
6
- "global_step": 1800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -241,13 +241,26 @@
241
  "eval_samples_per_second": 1.903,
242
  "eval_steps_per_second": 0.239,
243
  "step": 1800
 
 
 
 
 
 
 
 
 
 
 
 
 
244
  }
245
  ],
246
  "logging_steps": 100,
247
  "max_steps": 2025,
248
  "num_train_epochs": 3,
249
  "save_steps": 100,
250
- "total_flos": 3.74832717889536e+17,
251
  "trial_name": null,
252
  "trial_params": null
253
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.814814814814815,
5
  "eval_steps": 100,
6
+ "global_step": 1900,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
241
  "eval_samples_per_second": 1.903,
242
  "eval_steps_per_second": 0.239,
243
  "step": 1800
244
+ },
245
+ {
246
+ "epoch": 2.81,
247
+ "learning_rate": 0.0,
248
+ "loss": 8.657,
249
+ "step": 1900
250
+ },
251
+ {
252
+ "epoch": 2.81,
253
+ "eval_runtime": 787.6516,
254
+ "eval_samples_per_second": 1.904,
255
+ "eval_steps_per_second": 0.239,
256
+ "step": 1900
257
  }
258
  ],
259
  "logging_steps": 100,
260
  "max_steps": 2025,
261
  "num_train_epochs": 3,
262
  "save_steps": 100,
263
+ "total_flos": 3.95656757772288e+17,
264
  "trial_name": null,
265
  "trial_params": null
266
  }