Mithilss committed on
Commit
b7afdf4
1 Parent(s): 8f2985c

End of training

Browse files
README.md CHANGED
@@ -34,10 +34,10 @@ More information needed
34
 
35
  The following hyperparameters were used during training:
36
  - learning_rate: 0.0003
37
- - train_batch_size: 2
38
  - eval_batch_size: 8
39
  - seed: 42
40
- - gradient_accumulation_steps: 4
41
  - total_train_batch_size: 8
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: linear
 
34
 
35
  The following hyperparameters were used during training:
36
  - learning_rate: 0.0003
37
+ - train_batch_size: 1
38
  - eval_batch_size: 8
39
  - seed: 42
40
+ - gradient_accumulation_steps: 8
41
  - total_train_batch_size: 8
42
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
43
  - lr_scheduler_type: linear
adapter_config.json CHANGED
@@ -11,16 +11,16 @@
11
  "lora_dropout": 0.0,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
- "r": 8,
15
  "revision": null,
16
  "target_modules": [
17
  "down_proj",
 
18
  "gate_proj",
19
  "k_proj",
20
- "v_proj",
21
  "q_proj",
22
  "up_proj",
23
- "o_proj"
24
  ],
25
  "task_type": "CAUSAL_LM"
26
  }
 
11
  "lora_dropout": 0.0,
12
  "modules_to_save": null,
13
  "peft_type": "LORA",
14
+ "r": 16,
15
  "revision": null,
16
  "target_modules": [
17
  "down_proj",
18
+ "o_proj",
19
  "gate_proj",
20
  "k_proj",
 
21
  "q_proj",
22
  "up_proj",
23
+ "v_proj"
24
  ],
25
  "task_type": "CAUSAL_LM"
26
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a9ada0c0165015c8d9d417ac280537b96af25ee8bd2b1c6b7487f8e6b2c0fa3e
3
- size 30026872
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5726e7adba0ffa9bd5595d9805747c225cdbccd48b3b09dd166de2cd030c8c14
3
+ size 60010048
runs/Feb28_21-47-26_MithilAIPC/events.out.tfevents.1709137063.MithilAIPC.21972.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afafafb319e4575efe8b3adf127667590d8d8e6a66cc2119abcd1cee2dcd12c4
3
+ size 61640
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa16865030827f9fad3a591dca26dada37f9eaf1064fed7d73acf24a10266580
3
  size 5048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b14540e54927bf4ada65bb0a09730d1638b1954faa287b90513f0b43eba12172
3
  size 5048