jasmeeetsingh commited on
Commit
17bbc01
1 Parent(s): e20d2b0

Training in progress, step 4000, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:988222c18e3f64048638d3c02bc08fd31d975a6406a8caceb210af1620d62743
3
  size 2384440
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a7ed0dded696b441337c6a3e02eeeb7025ac5a9dbc38e4beafb2fb8d4e3aacf
3
  size 2384440
last-checkpoint/global_step4000/zero_pp_rank_0_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a351234226b27d25b42376b0ff8df9a62896e17a8d934a01fe74c52c8d52a7b2
3
+ size 3621285613
last-checkpoint/global_step4000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9edabaae742c644df0e2192b75d11539e39adf5895aa12c712657114d495a28a
3
+ size 3542398
last-checkpoint/global_step4000/zero_pp_rank_1_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da6b2634c730dba2bfde3af6588d68bdf73668df35c02556de67da96db21b0b2
3
+ size 3621285613
last-checkpoint/global_step4000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f32e844e2a99d0e8465671f8d2810dfe8c670aa644522df69f39ebb41fc39106
3
+ size 3542398
last-checkpoint/global_step4000/zero_pp_rank_2_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a37138fce80af6355d32448575574e8e43b457fba2e4d35f2192413d14c2540
3
+ size 3621285613
last-checkpoint/global_step4000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29e883eda5fd541cde5c3e2244871466340c4532372861a8dbed80a0cddb79ce
3
+ size 3542398
last-checkpoint/global_step4000/zero_pp_rank_3_mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dbe048b5c83d52c0dbb7dc09cf439e2b9523f46d4dc84e04031d52a4a710beb
3
+ size 3621285613
last-checkpoint/global_step4000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebf1317edbc8bb10493e249f63bcb26774f0f7a275a18cd993bf45ed4c5bbb98
3
+ size 3542398
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step3000
 
1
+ global_step4000
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1393a1bd6340e761de7801e9c6f7e59e9706236926efa740dd59227d925a310
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a142dcb9cfde5e88229e3b5ace7328347bbd5e2a82d8de6212af68514991a97
3
  size 17655
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16bc554ee121374c951d62b0801c1c0d7d1548c19e234b64560be1bb9eb187e9
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3f38c9ebf6cbb9cecc2d28d18b8137cbb6f6d9cf4049c5bbfcfbadd33075202
3
  size 17655
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:288fca69a948dbe63f462f084f6093a2adcb386d14c1cdd31b5223788308e476
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2da48feab99508949e07a607af5b17c36501d49c9f1080b4b6ab5d09991e9cf
3
  size 17655
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f85ce05b205ee73adeedec373f739143d8e0b9c49a5a9a8053966c410d6e493a
3
  size 17655
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d52bbf9f211ba1ba80a30cafcb91f904eb2d69ddd99a54b77502b1550f14155
3
  size 17655
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.3455824863174355,
5
  "eval_steps": 500,
6
- "global_step": 3000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -25,13 +25,19 @@
25
  "learning_rate": 0.0001,
26
  "loss": 0.4889,
27
  "step": 3000
 
 
 
 
 
 
28
  }
29
  ],
30
  "logging_steps": 1000,
31
  "max_steps": 12790,
32
  "num_train_epochs": 10,
33
  "save_steps": 1000,
34
- "total_flos": 21870936064000.0,
35
  "trial_name": null,
36
  "trial_params": null
37
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 3.127443315089914,
5
  "eval_steps": 500,
6
+ "global_step": 4000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
25
  "learning_rate": 0.0001,
26
  "loss": 0.4889,
27
  "step": 3000
28
+ },
29
+ {
30
+ "epoch": 3.13,
31
+ "learning_rate": 0.0001,
32
+ "loss": 0.4631,
33
+ "step": 4000
34
  }
35
  ],
36
  "logging_steps": 1000,
37
  "max_steps": 12790,
38
  "num_train_epochs": 10,
39
  "save_steps": 1000,
40
+ "total_flos": 29206081699840.0,
41
  "trial_name": null,
42
  "trial_params": null
43
  }