flytech committed on
Commit
c7dc115
1 Parent(s): f269569

Training in progress, step 1000, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8776e463dfb2fb241b207dcf6f197b8bcc48d01c1573dc9e37df7cf649be1f5
3
  size 160285149
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a91c94a3317d424396cebab93b82a8c58b613fe4abf0d6fcffd5315b8502bb89
3
  size 160285149
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:167de084d9751ce323bad469c1dc3226ac11b692074ae311e213a15b0836b0ac
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1f4e39da86dc5867b7d3c7f30f9588fe7974d19848a0aea34e0df4cde8b3932
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60f4fa52f793b7ffd9d5a0e3203e96f72580141d20eac3efe05c0fac6521a8ec
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ed2d4b131d874aa658f97c179cbc7aae45ebbdf63422dc95963b45fededa2b1
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.3333333333333333,
5
  "eval_steps": 100,
6
- "global_step": 900,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -124,13 +124,26 @@
124
  "eval_samples_per_second": 1.905,
125
  "eval_steps_per_second": 0.239,
126
  "step": 900
 
 
 
 
 
 
 
 
 
 
 
 
 
127
  }
128
  ],
129
  "logging_steps": 100,
130
  "max_steps": 2025,
131
  "num_train_epochs": 3,
132
  "save_steps": 100,
133
- "total_flos": 1.87416358944768e+17,
134
  "trial_name": null,
135
  "trial_params": null
136
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.4814814814814814,
5
  "eval_steps": 100,
6
+ "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
124
  "eval_samples_per_second": 1.905,
125
  "eval_steps_per_second": 0.239,
126
  "step": 900
127
+ },
128
+ {
129
+ "epoch": 1.48,
130
+ "learning_rate": 0.0,
131
+ "loss": 8.5777,
132
+ "step": 1000
133
+ },
134
+ {
135
+ "epoch": 1.48,
136
+ "eval_runtime": 787.2473,
137
+ "eval_samples_per_second": 1.905,
138
+ "eval_steps_per_second": 0.239,
139
+ "step": 1000
140
  }
141
  ],
142
  "logging_steps": 100,
143
  "max_steps": 2025,
144
  "num_train_epochs": 3,
145
  "save_steps": 100,
146
+ "total_flos": 2.0824039882752e+17,
147
  "trial_name": null,
148
  "trial_params": null
149
  }