MohamedAhmedAE committed on
Commit
3127737
1 Parent(s): bcca07c

Training in progress, step 2500, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1355a0456315e38ddd4e5bb14d13f3e60daf4a83eb0200f06f8ad70651e2671e
3
  size 1342238560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e113b4f4f7380ea91be321d7eb224a1892c29690b499cf104edbc1033fe5b04
3
  size 1342238560
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7573892481b9fc959cbab3bd079cfad71612c44c3de992eb02dd0ddb993d15b
3
  size 2852574238
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa6dff968ebc536d935f20500dfd3266e442e6914d65f9452ccde2523c539a55
3
  size 2852574238
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2de1ff0ec7b4f73410478352e0bc1e361ac7d425afa69cd020451718a9b7ad4
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d23adb5f8b168d9bd8854c7c24a982a4c7bb6c53373bc21471b5f28d834d745
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:15a8ae873ae1ad723f4506548bbe03017c25276924eb215dbc4422a986eb89bc
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ac3968049235612001c3413dd650a780dde8f9dab2897c02f639abe7251f8ed
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.1601067378252168,
5
  "eval_steps": 500,
6
- "global_step": 2400,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -207,6 +207,21 @@
207
  "learning_rate": 0.00019999787116827252,
208
  "loss": 2.4247,
209
  "step": 2400
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
210
  }
211
  ],
212
  "logging_steps": 100,
@@ -226,7 +241,7 @@
226
  "attributes": {}
227
  }
228
  },
229
- "total_flos": 4.866978990698496e+16,
230
  "train_batch_size": 4,
231
  "trial_name": null,
232
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.1667778519012675,
5
  "eval_steps": 500,
6
+ "global_step": 2500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
207
  "learning_rate": 0.00019999787116827252,
208
  "loss": 2.4247,
209
  "step": 2400
210
+ },
211
+ {
212
+ "epoch": 0.1667778519012675,
213
+ "grad_norm": 6.1392998695373535,
214
+ "learning_rate": 0.00019999411790321993,
215
+ "loss": 2.4662,
216
+ "step": 2500
217
+ },
218
+ {
219
+ "epoch": 0.1667778519012675,
220
+ "eval_loss": 2.4712343215942383,
221
+ "eval_runtime": 4209.0065,
222
+ "eval_samples_per_second": 2.353,
223
+ "eval_steps_per_second": 1.177,
224
+ "step": 2500
225
  }
226
  ],
227
  "logging_steps": 100,
 
241
  "attributes": {}
242
  }
243
  },
244
+ "total_flos": 5.065745562277478e+16,
245
  "train_batch_size": 4,
246
  "trial_name": null,
247
  "trial_params": null