hofarah commited on
Commit
dc83601
1 Parent(s): d6e65de

Training in progress, step 320

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d327d6055b26512249f738b530183f923a688879d89aee01c1a7f129ad20292b
3
  size 3545432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:717aeabd41162df58c589016e262864ca577bac403e982cd24e9397df8d808b9
3
  size 3545432
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e431d6677e21cb70645f73a949e7a206eba6b539e4319051fde1cf766602b528
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7dc2e0c6eac7de952444cda2f8a83b2d8ea1e3e332c7b71d88efa3373715d8
3
  size 1140034381
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b11dc40821345160db396d3d3b1fc931f4d0a9c790f3c549a309cd06fb1f698
3
- size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b2ebb2a66011e7d1a3811ef684f1282f4aaec21ae4f3b25e3ee99eaee99d42d
3
+ size 14511
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:329548916d80d2326c3e9113fcfe22537334086ae18a4696a380e612ee2dcea2
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:964c2be91d4357cef5d0efd7d9436b648b6eb7a171890a57465951684d53da2f
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.268686868686869,
5
- "global_step": 280,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -419,11 +419,70 @@
419
  "eval_samples_per_second": 0.061,
420
  "eval_steps_per_second": 0.032,
421
  "step": 280
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
422
  }
423
  ],
424
  "max_steps": 369,
425
  "num_train_epochs": 3,
426
- "total_flos": 1.092630821732352e+16,
427
  "trial_name": null,
428
  "trial_params": null
429
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.591919191919192,
5
+ "global_step": 320,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
419
  "eval_samples_per_second": 0.061,
420
  "eval_steps_per_second": 0.032,
421
  "step": 280
422
+ },
423
+ {
424
+ "epoch": 2.31,
425
+ "learning_rate": 1.1788617886178862e-05,
426
+ "loss": 3.0182,
427
+ "step": 285
428
+ },
429
+ {
430
+ "epoch": 2.35,
431
+ "learning_rate": 1.1111111111111112e-05,
432
+ "loss": 3.4221,
433
+ "step": 290
434
+ },
435
+ {
436
+ "epoch": 2.39,
437
+ "learning_rate": 1.0433604336043361e-05,
438
+ "loss": 3.1717,
439
+ "step": 295
440
+ },
441
+ {
442
+ "epoch": 2.43,
443
+ "learning_rate": 9.756097560975611e-06,
444
+ "loss": 3.309,
445
+ "step": 300
446
+ },
447
+ {
448
+ "epoch": 2.47,
449
+ "learning_rate": 9.078590785907859e-06,
450
+ "loss": 3.215,
451
+ "step": 305
452
+ },
453
+ {
454
+ "epoch": 2.51,
455
+ "learning_rate": 8.401084010840109e-06,
456
+ "loss": 3.2693,
457
+ "step": 310
458
+ },
459
+ {
460
+ "epoch": 2.55,
461
+ "learning_rate": 7.723577235772358e-06,
462
+ "loss": 3.3973,
463
+ "step": 315
464
+ },
465
+ {
466
+ "epoch": 2.59,
467
+ "learning_rate": 7.046070460704607e-06,
468
+ "loss": 3.3138,
469
+ "step": 320
470
+ },
471
+ {
472
+ "epoch": 2.59,
473
+ "eval_loss": 3.127232074737549,
474
+ "eval_rouge2_fmeasure": 0.0,
475
+ "eval_rouge2_precision": 0.0,
476
+ "eval_rouge2_recall": 0.0,
477
+ "eval_runtime": 495.8047,
478
+ "eval_samples_per_second": 0.054,
479
+ "eval_steps_per_second": 0.028,
480
+ "step": 320
481
  }
482
  ],
483
  "max_steps": 369,
484
  "num_train_epochs": 3,
485
+ "total_flos": 1.248720939122688e+16,
486
  "trial_name": null,
487
  "trial_params": null
488
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e431d6677e21cb70645f73a949e7a206eba6b539e4319051fde1cf766602b528
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af7dc2e0c6eac7de952444cda2f8a83b2d8ea1e3e332c7b71d88efa3373715d8
3
  size 1140034381