hofarah commited on
Commit
52b0df6
1 Parent(s): c46a08f

Training in progress, step 80

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f74d5f1a45d708b38e5462a32098619a77d216416ff27973af946caa6c7fbf36
3
  size 3544920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dbb11a70fcae64bec104647c5acced3c0cd79c0b44ee82b6f3f250254ec5e50
3
  size 3544920
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7ebbce591f251737d83478299d728e89bf21826c0f2b1592542f198360b0762
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276032cb589b04e8986400fdcfd96f9c2efadabf7a09d727dbe49fe1f4f6afbe
3
  size 1140034381
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d74287cececdc4f6ced3ef29c8a8d27ff10637de332defa7d4dbb07c0865050
3
- size 14511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04ae77db66de79b69f8a3d821bbb733e237d660fa8765e0a2763c1fceddcd297
3
+ size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7345e2891e6c7505609bb455ba0e660aaff504ba8618e8322a39b4afd34a7832
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ecf13dfb953ccd15ae617ed9a359fdf95573284a2df37f02a60ab75ef4e68b6
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.32323232323232326,
5
- "global_step": 40,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -65,11 +65,70 @@
65
  "eval_samples_per_second": 0.15,
66
  "eval_steps_per_second": 0.078,
67
  "step": 40
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
68
  }
69
  ],
70
  "max_steps": 369,
71
  "num_train_epochs": 3,
72
- "total_flos": 1560901173903360.0,
73
  "trial_name": null,
74
  "trial_params": null
75
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.6464646464646465,
5
+ "global_step": 80,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
65
  "eval_samples_per_second": 0.15,
66
  "eval_steps_per_second": 0.078,
67
  "step": 40
68
+ },
69
+ {
70
+ "epoch": 0.36,
71
+ "learning_rate": 4.4037940379403794e-05,
72
+ "loss": 3.5264,
73
+ "step": 45
74
+ },
75
+ {
76
+ "epoch": 0.4,
77
+ "learning_rate": 4.336043360433605e-05,
78
+ "loss": 3.6286,
79
+ "step": 50
80
+ },
81
+ {
82
+ "epoch": 0.44,
83
+ "learning_rate": 4.26829268292683e-05,
84
+ "loss": 3.4611,
85
+ "step": 55
86
+ },
87
+ {
88
+ "epoch": 0.48,
89
+ "learning_rate": 4.2005420054200545e-05,
90
+ "loss": 3.9319,
91
+ "step": 60
92
+ },
93
+ {
94
+ "epoch": 0.53,
95
+ "learning_rate": 4.132791327913279e-05,
96
+ "loss": 3.7751,
97
+ "step": 65
98
+ },
99
+ {
100
+ "epoch": 0.57,
101
+ "learning_rate": 4.065040650406504e-05,
102
+ "loss": 3.6241,
103
+ "step": 70
104
+ },
105
+ {
106
+ "epoch": 0.61,
107
+ "learning_rate": 3.9972899728997295e-05,
108
+ "loss": 3.3906,
109
+ "step": 75
110
+ },
111
+ {
112
+ "epoch": 0.65,
113
+ "learning_rate": 3.9295392953929537e-05,
114
+ "loss": 3.1815,
115
+ "step": 80
116
+ },
117
+ {
118
+ "epoch": 0.65,
119
+ "eval_loss": 3.189028739929199,
120
+ "eval_rouge2_fmeasure": 0.0,
121
+ "eval_rouge2_precision": 0.0,
122
+ "eval_rouge2_recall": 0.0,
123
+ "eval_runtime": 265.9332,
124
+ "eval_samples_per_second": 0.102,
125
+ "eval_steps_per_second": 0.053,
126
+ "step": 80
127
  }
128
  ],
129
  "max_steps": 369,
130
  "num_train_epochs": 3,
131
+ "total_flos": 3121802347806720.0,
132
  "trial_name": null,
133
  "trial_params": null
134
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c7ebbce591f251737d83478299d728e89bf21826c0f2b1592542f198360b0762
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276032cb589b04e8986400fdcfd96f9c2efadabf7a09d727dbe49fe1f4f6afbe
3
  size 1140034381