Training in progress, step 60, checkpoint

Files changed (6) hide show

last-checkpoint/adapter_config.json CHANGED Viewed

@@ -1,9 +1,6 @@
 {
   "alpha_pattern": {},
-  "auto_mapping": {
-    "base_model_class": "BloomForCausalLM",
-    "parent_library": "transformers.models.bloom.modeling_bloom"
-  },
   "base_model_name_or_path": "bigscience/bloomz-1b1",
   "bias": "none",
   "fan_in_fan_out": false,
@@ -26,7 +23,7 @@
     "query_key_valuelm_head",
     "word_embeddings"
   ],
-  "task_type": null,
   "use_dora": false,
   "use_rslora": false
 }

 {
   "alpha_pattern": {},
+  "auto_mapping": null,
   "base_model_name_or_path": "bigscience/bloomz-1b1",
   "bias": "none",
   "fan_in_fan_out": false,
     "query_key_valuelm_head",
     "word_embeddings"
   ],
+  "task_type": "CAUSAL_LM",
   "use_dora": false,
   "use_rslora": false
 }

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:270f7a985c38ef87d3b0c62d407b8c8e1e8a69c4b0b3fcff9cbdaefb08b99e6e
 size 8077608

 version https://git-lfs.github.com/spec/v1
+oid sha256:de52612f18d94eb85267cdbaa87cfac914b5a3415370220f048ff6627b5dc973
 size 8077608

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:982d07f785f45a60ecb772290342d804c23af42b43a0e9ec31f36d884de5be86
 size 4052500

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7da0cccb26e635a9bb8fe359b98f58b1fe7d55939c5f6f51514ca872caa19e9
 size 4052500

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:384b1441690cc32db0a09ece90eb10816e434402fb6deac7559104dc40fcf585
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:386fcc8cc1089aade9450d86fb239ea3483f455fd2d78d8378645feecfec9d69
 size 14244

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -10,23 +10,23 @@
   "log_history": [
     {
       "epoch": 0.0,
-      "grad_norm": 103.39625549316406,
       "learning_rate": 2.341780598043574e-05,
-      "loss": 4.678,
       "step": 20
     },
     {
       "epoch": 0.0,
-      "grad_norm": 248.84193420410156,
       "learning_rate": 7.97387338950315e-06,
-      "loss": 4.5269,
       "step": 40
     },
     {
       "epoch": 0.0,
-      "grad_norm": 73.25434112548828,
       "learning_rate": 0.0,
-      "loss": 4.8386,
       "step": 60
     }
   ],

   "log_history": [
     {
       "epoch": 0.0,
+      "grad_norm": 87.1609115600586,
       "learning_rate": 2.341780598043574e-05,
+      "loss": 4.6745,
       "step": 20
     },
     {
       "epoch": 0.0,
+      "grad_norm": 226.922119140625,
       "learning_rate": 7.97387338950315e-06,
+      "loss": 4.5875,
       "step": 40
     },
     {
       "epoch": 0.0,
+      "grad_norm": 86.45769500732422,
       "learning_rate": 0.0,
+      "loss": 4.8834,
       "step": 60
     }
   ],

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:439f3807656f67fbb80a340aba983b1e64e3589ce5602b15e2abaffb2bc57416
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:83256b55088d45d0ebeda1319a91e9b247c70b5f4d82cb04a018aa4a684554bc
 size 4984