yizhujiao committed on
Commit
efdefe5
1 Parent(s): 9d80ce8

Training in progress, step 500

Browse files
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd06b631ae0e175719fa7925d2c9357fc164b0f5c3f94110f0591a96f4b48aad
3
- size 4230006368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2edcfe5c3d4ee172d27acc9814de45f14cbaaaa1b3caf9237d049d33a43cf08
3
+ size 27280152
special_tokens_map.json CHANGED
@@ -14,7 +14,7 @@
14
  "single_word": false
15
  },
16
  "pad_token": {
17
- "content": "<|pad|>",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
 
14
  "single_word": false
15
  },
16
  "pad_token": {
17
+ "content": "[PAD]",
18
  "lstrip": false,
19
  "normalized": false,
20
  "rstrip": false,
tokenizer.json CHANGED
@@ -2309,7 +2309,7 @@
2309
  },
2310
  {
2311
  "id": 128256,
2312
- "content": "<|pad|>",
2313
  "single_word": false,
2314
  "lstrip": false,
2315
  "rstrip": false,
@@ -2338,69 +2338,85 @@
2338
  ]
2339
  },
2340
  "post_processor": {
2341
- "type": "Sequence",
2342
- "processors": [
2343
  {
2344
- "type": "ByteLevel",
2345
- "add_prefix_space": true,
2346
- "trim_offsets": false,
2347
- "use_regex": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2348
  },
2349
  {
2350
- "type": "TemplateProcessing",
2351
- "single": [
2352
- {
2353
- "SpecialToken": {
2354
- "id": "<|begin_of_text|>",
2355
- "type_id": 0
2356
- }
2357
- },
2358
- {
2359
- "Sequence": {
2360
- "id": "A",
2361
- "type_id": 0
2362
- }
2363
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2364
  ],
2365
- "pair": [
2366
- {
2367
- "SpecialToken": {
2368
- "id": "<|begin_of_text|>",
2369
- "type_id": 0
2370
- }
2371
- },
2372
- {
2373
- "Sequence": {
2374
- "id": "A",
2375
- "type_id": 0
2376
- }
2377
- },
2378
- {
2379
- "SpecialToken": {
2380
- "id": "<|begin_of_text|>",
2381
- "type_id": 1
2382
- }
2383
- },
2384
- {
2385
- "Sequence": {
2386
- "id": "B",
2387
- "type_id": 1
2388
- }
2389
- }
2390
  ],
2391
- "special_tokens": {
2392
- "<|begin_of_text|>": {
2393
- "id": "<|begin_of_text|>",
2394
- "ids": [
2395
- 128000
2396
- ],
2397
- "tokens": [
2398
- "<|begin_of_text|>"
2399
- ]
2400
- }
2401
- }
2402
  }
2403
- ]
2404
  },
2405
  "decoder": {
2406
  "type": "ByteLevel",
 
2309
  },
2310
  {
2311
  "id": 128256,
2312
+ "content": "[PAD]",
2313
  "single_word": false,
2314
  "lstrip": false,
2315
  "rstrip": false,
 
2338
  ]
2339
  },
2340
  "post_processor": {
2341
+ "type": "TemplateProcessing",
2342
+ "single": [
2343
  {
2344
+ "SpecialToken": {
2345
+ "id": "<|begin_of_text|>",
2346
+ "type_id": 0
2347
+ }
2348
+ },
2349
+ {
2350
+ "Sequence": {
2351
+ "id": "A",
2352
+ "type_id": 0
2353
+ }
2354
+ },
2355
+ {
2356
+ "SpecialToken": {
2357
+ "id": "<|eot_id|>",
2358
+ "type_id": 0
2359
+ }
2360
+ }
2361
+ ],
2362
+ "pair": [
2363
+ {
2364
+ "SpecialToken": {
2365
+ "id": "<|begin_of_text|>",
2366
+ "type_id": 0
2367
+ }
2368
+ },
2369
+ {
2370
+ "Sequence": {
2371
+ "id": "A",
2372
+ "type_id": 0
2373
+ }
2374
  },
2375
  {
2376
+ "SpecialToken": {
2377
+ "id": "<|eot_id|>",
2378
+ "type_id": 0
2379
+ }
2380
+ },
2381
+ {
2382
+ "SpecialToken": {
2383
+ "id": "<|begin_of_text|>",
2384
+ "type_id": 1
2385
+ }
2386
+ },
2387
+ {
2388
+ "Sequence": {
2389
+ "id": "B",
2390
+ "type_id": 1
2391
+ }
2392
+ },
2393
+ {
2394
+ "SpecialToken": {
2395
+ "id": "<|eot_id|>",
2396
+ "type_id": 1
2397
+ }
2398
+ }
2399
+ ],
2400
+ "special_tokens": {
2401
+ "<|begin_of_text|>": {
2402
+ "id": "<|begin_of_text|>",
2403
+ "ids": [
2404
+ 128000
2405
  ],
2406
+ "tokens": [
2407
+ "<|begin_of_text|>"
2408
+ ]
2409
+ },
2410
+ "<|eot_id|>": {
2411
+ "id": "<|eot_id|>",
2412
+ "ids": [
2413
+ 128009
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2414
  ],
2415
+ "tokens": [
2416
+ "<|eot_id|>"
2417
+ ]
 
 
 
 
 
 
 
 
2418
  }
2419
+ }
2420
  },
2421
  "decoder": {
2422
  "type": "ByteLevel",
tokenizer_config.json CHANGED
@@ -2050,7 +2050,7 @@
2050
  "special": true
2051
  },
2052
  "128256": {
2053
- "content": "<|pad|>",
2054
  "lstrip": false,
2055
  "normalized": false,
2056
  "rstrip": false,
@@ -2067,6 +2067,6 @@
2067
  "attention_mask"
2068
  ],
2069
  "model_max_length": 1000000000000000019884624838656,
2070
- "pad_token": "<|pad|>",
2071
  "tokenizer_class": "PreTrainedTokenizerFast"
2072
  }
 
2050
  "special": true
2051
  },
2052
  "128256": {
2053
+ "content": "[PAD]",
2054
  "lstrip": false,
2055
  "normalized": false,
2056
  "rstrip": false,
 
2067
  "attention_mask"
2068
  ],
2069
  "model_max_length": 1000000000000000019884624838656,
2070
+ "pad_token": "[PAD]",
2071
  "tokenizer_class": "PreTrainedTokenizerFast"
2072
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c357fe17f15f6fd7f122fe76192d627bbbcb93c64265ccbd73be5de80a67b09
3
- size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de903dff6a4584879db6512a2b3cd907b4d6a195d14e6c049cc8a18e0c6a0fa3
3
+ size 5432