yizhujiao committed on
Commit
9100c07
1 Parent(s): 66e5423

Training in progress, step 500

Browse files
adapter_config.json CHANGED
@@ -20,8 +20,8 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "q_proj",
24
- "v_proj"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "v_proj",
24
+ "q_proj"
25
  ],
26
  "task_type": "CAUSAL_LM",
27
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd21bce58cd6f1b67a46c5ba4b28deb9dab27e678803f0cd87d59f12ae39d542
3
- size 27280152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da0266b2d829ae02c56e186cd54539d8ca0b43464b683a51d1c85423ba4cb5d1
3
+ size 4230006368
tokenizer.json CHANGED
@@ -2338,85 +2338,69 @@
2338
  ]
2339
  },
2340
  "post_processor": {
2341
- "type": "TemplateProcessing",
2342
- "single": [
2343
- {
2344
- "SpecialToken": {
2345
- "id": "<|begin_of_text|>",
2346
- "type_id": 0
2347
- }
2348
- },
2349
- {
2350
- "Sequence": {
2351
- "id": "A",
2352
- "type_id": 0
2353
- }
2354
- },
2355
- {
2356
- "SpecialToken": {
2357
- "id": "<|eot_id|>",
2358
- "type_id": 0
2359
- }
2360
- }
2361
- ],
2362
- "pair": [
2363
- {
2364
- "SpecialToken": {
2365
- "id": "<|begin_of_text|>",
2366
- "type_id": 0
2367
- }
2368
- },
2369
- {
2370
- "Sequence": {
2371
- "id": "A",
2372
- "type_id": 0
2373
- }
2374
- },
2375
- {
2376
- "SpecialToken": {
2377
- "id": "<|eot_id|>",
2378
- "type_id": 0
2379
- }
2380
- },
2381
- {
2382
- "SpecialToken": {
2383
- "id": "<|begin_of_text|>",
2384
- "type_id": 1
2385
- }
2386
- },
2387
  {
2388
- "Sequence": {
2389
- "id": "B",
2390
- "type_id": 1
2391
- }
2392
  },
2393
  {
2394
- "SpecialToken": {
2395
- "id": "<|eot_id|>",
2396
- "type_id": 1
2397
- }
2398
- }
2399
- ],
2400
- "special_tokens": {
2401
- "<|begin_of_text|>": {
2402
- "id": "<|begin_of_text|>",
2403
- "ids": [
2404
- 128000
 
 
 
2405
  ],
2406
- "tokens": [
2407
- "<|begin_of_text|>"
2408
- ]
2409
- },
2410
- "<|eot_id|>": {
2411
- "id": "<|eot_id|>",
2412
- "ids": [
2413
- 128009
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2414
  ],
2415
- "tokens": [
2416
- "<|eot_id|>"
2417
- ]
 
 
 
 
 
 
 
 
2418
  }
2419
- }
2420
  },
2421
  "decoder": {
2422
  "type": "ByteLevel",
 
2338
  ]
2339
  },
2340
  "post_processor": {
2341
+ "type": "Sequence",
2342
+ "processors": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2343
  {
2344
+ "type": "ByteLevel",
2345
+ "add_prefix_space": true,
2346
+ "trim_offsets": false,
2347
+ "use_regex": true
2348
  },
2349
  {
2350
+ "type": "TemplateProcessing",
2351
+ "single": [
2352
+ {
2353
+ "SpecialToken": {
2354
+ "id": "<|begin_of_text|>",
2355
+ "type_id": 0
2356
+ }
2357
+ },
2358
+ {
2359
+ "Sequence": {
2360
+ "id": "A",
2361
+ "type_id": 0
2362
+ }
2363
+ }
2364
  ],
2365
+ "pair": [
2366
+ {
2367
+ "SpecialToken": {
2368
+ "id": "<|begin_of_text|>",
2369
+ "type_id": 0
2370
+ }
2371
+ },
2372
+ {
2373
+ "Sequence": {
2374
+ "id": "A",
2375
+ "type_id": 0
2376
+ }
2377
+ },
2378
+ {
2379
+ "SpecialToken": {
2380
+ "id": "<|begin_of_text|>",
2381
+ "type_id": 1
2382
+ }
2383
+ },
2384
+ {
2385
+ "Sequence": {
2386
+ "id": "B",
2387
+ "type_id": 1
2388
+ }
2389
+ }
2390
  ],
2391
+ "special_tokens": {
2392
+ "<|begin_of_text|>": {
2393
+ "id": "<|begin_of_text|>",
2394
+ "ids": [
2395
+ 128000
2396
+ ],
2397
+ "tokens": [
2398
+ "<|begin_of_text|>"
2399
+ ]
2400
+ }
2401
+ }
2402
  }
2403
+ ]
2404
  },
2405
  "decoder": {
2406
  "type": "ByteLevel",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de903dff6a4584879db6512a2b3cd907b4d6a195d14e6c049cc8a18e0c6a0fa3
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b14d20c6c5e870f0b338575500fa87c2941961ec67d884d28da36335032f79f
3
  size 5432