ryper1 committed on
Commit
b57c599
1 Parent(s): 9a5bc15

Training in progress, epoch 1

Browse files
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "meta-llama/Meta-Llama-3-8B-Instruct",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "k_proj",
24
  "q_proj",
 
 
25
  "v_proj",
 
26
  "down_proj",
27
- "gate_proj",
28
- "o_proj",
29
- "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "meta-llama/Meta-Llama-3-70B-Instruct",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "q_proj",
24
+ "gate_proj",
25
+ "k_proj",
26
  "v_proj",
27
+ "up_proj",
28
  "down_proj",
29
+ "o_proj"
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95551f9b0cef452e81324c61fde9601d5b242da988dbcb552daae1cba2688c02
3
- size 3443619040
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdb9f0d2b845f9c6d865e33135df5b987073982d9c8c1146b07eadcf9c2c548c
3
+ size 17456914576
runs/Sep09_10-46-24_lxn-ejplab/events.out.tfevents.1725893205.lxn-ejplab ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:029bce1140d688cb30f24f05868d44f1ae14480bcec78aec348b0ead6915f17a
3
+ size 5881
runs/Sep09_10-51-58_lxn-ejplab/events.out.tfevents.1725893539.lxn-ejplab ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62b72a64fde2494b49dee0a4d918c91b3226cb9124cac89a3016bf2c08611142
3
+ size 5881
runs/Sep09_10-56-12_lxn-ejplab/events.out.tfevents.1725893793.lxn-ejplab ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b754a3ffbf81057f04588273e68bd3c513e374b57e5c1a334f7fda6ffdd4da7d
3
+ size 6709
special_tokens_map.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "additional_special_tokens": [
3
  {
4
- "content": "<|im_end|>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
- "content": "<|im_start|>",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
 
1
  {
2
  "additional_special_tokens": [
3
  {
4
+ "content": "<|im_start|>",
5
  "lstrip": false,
6
  "normalized": false,
7
  "rstrip": false,
8
  "single_word": false
9
  },
10
  {
11
+ "content": "<|im_end|>",
12
  "lstrip": false,
13
  "normalized": false,
14
  "rstrip": false,
tokenizer.json CHANGED
@@ -2309,7 +2309,7 @@
2309
  },
2310
  {
2311
  "id": 128256,
2312
- "content": "<|im_end|>",
2313
  "single_word": false,
2314
  "lstrip": false,
2315
  "rstrip": false,
@@ -2318,7 +2318,7 @@
2318
  },
2319
  {
2320
  "id": 128257,
2321
- "content": "<|im_start|>",
2322
  "single_word": false,
2323
  "lstrip": false,
2324
  "rstrip": false,
@@ -2425,6 +2425,7 @@
2425
  "end_of_word_suffix": null,
2426
  "fuse_unk": false,
2427
  "byte_fallback": false,
 
2428
  "vocab": {
2429
  "!": 0,
2430
  "\"": 1,
 
2309
  },
2310
  {
2311
  "id": 128256,
2312
+ "content": "<|im_start|>",
2313
  "single_word": false,
2314
  "lstrip": false,
2315
  "rstrip": false,
 
2318
  },
2319
  {
2320
  "id": 128257,
2321
+ "content": "<|im_end|>",
2322
  "single_word": false,
2323
  "lstrip": false,
2324
  "rstrip": false,
 
2425
  "end_of_word_suffix": null,
2426
  "fuse_unk": false,
2427
  "byte_fallback": false,
2428
+ "ignore_merges": true,
2429
  "vocab": {
2430
  "!": 0,
2431
  "\"": 1,
tokenizer_config.json CHANGED
@@ -2049,7 +2049,7 @@
2049
  "special": true
2050
  },
2051
  "128256": {
2052
- "content": "<|im_end|>",
2053
  "lstrip": false,
2054
  "normalized": false,
2055
  "rstrip": false,
@@ -2057,7 +2057,7 @@
2057
  "special": true
2058
  },
2059
  "128257": {
2060
- "content": "<|im_start|>",
2061
  "lstrip": false,
2062
  "normalized": false,
2063
  "rstrip": false,
@@ -2066,8 +2066,8 @@
2066
  }
2067
  },
2068
  "additional_special_tokens": [
2069
- "<|im_end|>",
2070
- "<|im_start|>"
2071
  ],
2072
  "bos_token": "<|im_start|>",
2073
  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
 
2049
  "special": true
2050
  },
2051
  "128256": {
2052
+ "content": "<|im_start|>",
2053
  "lstrip": false,
2054
  "normalized": false,
2055
  "rstrip": false,
 
2057
  "special": true
2058
  },
2059
  "128257": {
2060
+ "content": "<|im_end|>",
2061
  "lstrip": false,
2062
  "normalized": false,
2063
  "rstrip": false,
 
2066
  }
2067
  },
2068
  "additional_special_tokens": [
2069
+ "<|im_start|>",
2070
+ "<|im_end|>"
2071
  ],
2072
  "bos_token": "<|im_start|>",
2073
  "chat_template": "{% for message in messages %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10abe1dc050642c6751f84c7a454c06a3326eae745a3c445cce01f75b7edaafa
3
- size 4283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0171d5032677484029dfd2bc3a9aab38c0b75ae12ce291b139b9977ad0d580f
3
+ size 5560