hofarah commited on
Commit
120cdd1
1 Parent(s): 9e33483

Training in progress, step 200

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4dc7b5a5ba3656e7e3ba33577f9d5c221551eb9ac38a8241da63b379cad73607
3
  size 3544920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fb09faafe86c3f8a3809c282ff2b33e506a3661a79e5616b8276d0b82097d48
3
  size 3544920
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:694ade40292a0236fc581f36db7f75221ac5f2bf62938e0d5acefb6040f8d4ce
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:897b7b593f9821dbb0e2ae6d611894c506aa52d82fe38b6c5255a258f0b4cb62
3
  size 1140034381
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5134742d8a3e0eb4235ccb75ae0c32f1d18107769b8c95d8a28999819cb8fa18
3
- size 14511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46c7746ace7f5308e25daef2d7e569acf6cec5538b3a1f0aa281a80ddbbed1a8
3
+ size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5e25f2c0298e32eb32bc4fd13a32a452c19048d5a88e784c5908ed1a05a2bbb1
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da8d90b6a7613e88ebb00326afe3e46f5e2c7dab4f2323f113d4b53f6fc1eea8
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.2929292929292928,
5
- "global_step": 160,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -242,11 +242,70 @@
242
  "eval_samples_per_second": 0.073,
243
  "eval_steps_per_second": 0.038,
244
  "step": 160
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
245
  }
246
  ],
247
  "max_steps": 369,
248
  "num_train_epochs": 3,
249
- "total_flos": 6243604695613440.0,
250
  "trial_name": null,
251
  "trial_params": null
252
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.6161616161616161,
5
+ "global_step": 200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
242
  "eval_samples_per_second": 0.073,
243
  "eval_steps_per_second": 0.038,
244
  "step": 160
245
+ },
246
+ {
247
+ "epoch": 1.33,
248
+ "learning_rate": 2.7913279132791332e-05,
249
+ "loss": 3.0798,
250
+ "step": 165
251
+ },
252
+ {
253
+ "epoch": 1.37,
254
+ "learning_rate": 2.7235772357723577e-05,
255
+ "loss": 3.2169,
256
+ "step": 170
257
+ },
258
+ {
259
+ "epoch": 1.41,
260
+ "learning_rate": 2.6558265582655828e-05,
261
+ "loss": 3.4364,
262
+ "step": 175
263
+ },
264
+ {
265
+ "epoch": 1.45,
266
+ "learning_rate": 2.588075880758808e-05,
267
+ "loss": 3.2353,
268
+ "step": 180
269
+ },
270
+ {
271
+ "epoch": 1.49,
272
+ "learning_rate": 2.5203252032520324e-05,
273
+ "loss": 3.4389,
274
+ "step": 185
275
+ },
276
+ {
277
+ "epoch": 1.54,
278
+ "learning_rate": 2.4525745257452575e-05,
279
+ "loss": 3.2847,
280
+ "step": 190
281
+ },
282
+ {
283
+ "epoch": 1.58,
284
+ "learning_rate": 2.3848238482384823e-05,
285
+ "loss": 3.0442,
286
+ "step": 195
287
+ },
288
+ {
289
+ "epoch": 1.62,
290
+ "learning_rate": 2.3170731707317075e-05,
291
+ "loss": 3.2043,
292
+ "step": 200
293
+ },
294
+ {
295
+ "epoch": 1.62,
296
+ "eval_loss": 3.1420483589172363,
297
+ "eval_rouge2_fmeasure": 0.0032,
298
+ "eval_rouge2_precision": 0.0041,
299
+ "eval_rouge2_recall": 0.0026,
300
+ "eval_runtime": 417.3311,
301
+ "eval_samples_per_second": 0.065,
302
+ "eval_steps_per_second": 0.034,
303
+ "step": 200
304
  }
305
  ],
306
  "max_steps": 369,
307
  "num_train_epochs": 3,
308
+ "total_flos": 7804505869516800.0,
309
  "trial_name": null,
310
  "trial_params": null
311
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:694ade40292a0236fc581f36db7f75221ac5f2bf62938e0d5acefb6040f8d4ce
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:897b7b593f9821dbb0e2ae6d611894c506aa52d82fe38b6c5255a258f0b4cb62
3
  size 1140034381