hofarah commited on
Commit
6bf6cda
1 Parent(s): 52b0df6

Training in progress, step 120

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3dbb11a70fcae64bec104647c5acced3c0cd79c0b44ee82b6f3f250254ec5e50
3
  size 3544920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dee7c0b39ba072977a286772c0af8b9fc2500ede55b83bc1199a158f6dfc1722
3
  size 3544920
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:276032cb589b04e8986400fdcfd96f9c2efadabf7a09d727dbe49fe1f4f6afbe
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66a11f66a4c84be3caa48c29e8c74885ea6b56dddb765149269bfd08b8903328
3
  size 1140034381
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04ae77db66de79b69f8a3d821bbb733e237d660fa8765e0a2763c1fceddcd297
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ac223aa8ee652f038edd3082fd2a44bd13436ca909976cb75fcc2c2108ab8b1
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ecf13dfb953ccd15ae617ed9a359fdf95573284a2df37f02a60ab75ef4e68b6
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f83af140ab0aa237edb30d0fe7c12244f0dd58eccf65131d8908858944652ecc
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.6464646464646465,
5
- "global_step": 80,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -124,11 +124,70 @@
124
  "eval_samples_per_second": 0.102,
125
  "eval_steps_per_second": 0.053,
126
  "step": 80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
127
  }
128
  ],
129
  "max_steps": 369,
130
  "num_train_epochs": 3,
131
- "total_flos": 3121802347806720.0,
132
  "trial_name": null,
133
  "trial_params": null
134
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9696969696969697,
5
+ "global_step": 120,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
124
  "eval_samples_per_second": 0.102,
125
  "eval_steps_per_second": 0.053,
126
  "step": 80
127
+ },
128
+ {
129
+ "epoch": 0.69,
130
+ "learning_rate": 3.861788617886179e-05,
131
+ "loss": 3.3673,
132
+ "step": 85
133
+ },
134
+ {
135
+ "epoch": 0.73,
136
+ "learning_rate": 3.794037940379404e-05,
137
+ "loss": 3.3792,
138
+ "step": 90
139
+ },
140
+ {
141
+ "epoch": 0.77,
142
+ "learning_rate": 3.726287262872629e-05,
143
+ "loss": 3.5732,
144
+ "step": 95
145
+ },
146
+ {
147
+ "epoch": 0.81,
148
+ "learning_rate": 3.6585365853658535e-05,
149
+ "loss": 3.2772,
150
+ "step": 100
151
+ },
152
+ {
153
+ "epoch": 0.85,
154
+ "learning_rate": 3.6043360433604336e-05,
155
+ "loss": 3.3803,
156
+ "step": 105
157
+ },
158
+ {
159
+ "epoch": 0.89,
160
+ "learning_rate": 3.5365853658536584e-05,
161
+ "loss": 3.2597,
162
+ "step": 110
163
+ },
164
+ {
165
+ "epoch": 0.93,
166
+ "learning_rate": 3.468834688346884e-05,
167
+ "loss": 3.4085,
168
+ "step": 115
169
+ },
170
+ {
171
+ "epoch": 0.97,
172
+ "learning_rate": 3.401084010840109e-05,
173
+ "loss": 3.2319,
174
+ "step": 120
175
+ },
176
+ {
177
+ "epoch": 0.97,
178
+ "eval_loss": 3.166618824005127,
179
+ "eval_rouge2_fmeasure": 0.0,
180
+ "eval_rouge2_precision": 0.0,
181
+ "eval_rouge2_recall": 0.0,
182
+ "eval_runtime": 433.3435,
183
+ "eval_samples_per_second": 0.062,
184
+ "eval_steps_per_second": 0.032,
185
+ "step": 120
186
  }
187
  ],
188
  "max_steps": 369,
189
  "num_train_epochs": 3,
190
+ "total_flos": 4682703521710080.0,
191
  "trial_name": null,
192
  "trial_params": null
193
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:276032cb589b04e8986400fdcfd96f9c2efadabf7a09d727dbe49fe1f4f6afbe
3
  size 1140034381
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66a11f66a4c84be3caa48c29e8c74885ea6b56dddb765149269bfd08b8903328
3
  size 1140034381