Femboyuwu2000 committed on
Commit
a34dff5
1 Parent(s): 481b4b2

Training in progress, step 60, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -1,9 +1,6 @@
1
  {
2
  "alpha_pattern": {},
3
- "auto_mapping": {
4
- "base_model_class": "BloomForCausalLM",
5
- "parent_library": "transformers.models.bloom.modeling_bloom"
6
- },
7
  "base_model_name_or_path": "bigscience/bloomz-1b1",
8
  "bias": "none",
9
  "fan_in_fan_out": false,
@@ -26,7 +23,7 @@
26
  "query_key_valuelm_head",
27
  "word_embeddings"
28
  ],
29
- "task_type": null,
30
  "use_dora": false,
31
  "use_rslora": false
32
  }
 
1
  {
2
  "alpha_pattern": {},
3
+ "auto_mapping": null,
 
 
 
4
  "base_model_name_or_path": "bigscience/bloomz-1b1",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
 
23
  "query_key_valuelm_head",
24
  "word_embeddings"
25
  ],
26
+ "task_type": "CAUSAL_LM",
27
  "use_dora": false,
28
  "use_rslora": false
29
  }
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:270f7a985c38ef87d3b0c62d407b8c8e1e8a69c4b0b3fcff9cbdaefb08b99e6e
3
  size 8077608
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de52612f18d94eb85267cdbaa87cfac914b5a3415370220f048ff6627b5dc973
3
  size 8077608
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:982d07f785f45a60ecb772290342d804c23af42b43a0e9ec31f36d884de5be86
3
  size 4052500
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7da0cccb26e635a9bb8fe359b98f58b1fe7d55939c5f6f51514ca872caa19e9
3
  size 4052500
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:384b1441690cc32db0a09ece90eb10816e434402fb6deac7559104dc40fcf585
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:386fcc8cc1089aade9450d86fb239ea3483f455fd2d78d8378645feecfec9d69
3
  size 14244
last-checkpoint/trainer_state.json CHANGED
@@ -10,23 +10,23 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
- "grad_norm": 103.39625549316406,
14
  "learning_rate": 2.341780598043574e-05,
15
- "loss": 4.678,
16
  "step": 20
17
  },
18
  {
19
  "epoch": 0.0,
20
- "grad_norm": 248.84193420410156,
21
  "learning_rate": 7.97387338950315e-06,
22
- "loss": 4.5269,
23
  "step": 40
24
  },
25
  {
26
  "epoch": 0.0,
27
- "grad_norm": 73.25434112548828,
28
  "learning_rate": 0.0,
29
- "loss": 4.8386,
30
  "step": 60
31
  }
32
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.0,
13
+ "grad_norm": 87.1609115600586,
14
  "learning_rate": 2.341780598043574e-05,
15
+ "loss": 4.6745,
16
  "step": 20
17
  },
18
  {
19
  "epoch": 0.0,
20
+ "grad_norm": 226.922119140625,
21
  "learning_rate": 7.97387338950315e-06,
22
+ "loss": 4.5875,
23
  "step": 40
24
  },
25
  {
26
  "epoch": 0.0,
27
+ "grad_norm": 86.45769500732422,
28
  "learning_rate": 0.0,
29
+ "loss": 4.8834,
30
  "step": 60
31
  }
32
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:439f3807656f67fbb80a340aba983b1e64e3589ce5602b15e2abaffb2bc57416
3
  size 4984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83256b55088d45d0ebeda1319a91e9b247c70b5f4d82cb04a018aa4a684554bc
3
  size 4984