euclaise committed on
Commit
4ffd090
1 Parent(s): 7ee2243

Upload tokenizer

Browse files
Files changed (2) hide show
  1. README.md +5 -5
  2. tokenizer_config.json +1 -0
README.md CHANGED
@@ -1,7 +1,8 @@
1
  ---
2
- base_model:
3
- - euclaise/Memphis-CoT-3B
4
  license: cc-by-4.0
 
 
 
5
  datasets:
6
  - euclaise/TinyCoT
7
  - euclaise/mathoverflow-accepted
@@ -13,9 +14,8 @@ datasets:
13
  - pszemraj/booksum-short
14
  - euclaise/reddit-instruct
15
  - euclaise/SciCoT
16
- library_name: transformers
17
- tags:
18
- - supertrainer2000
19
  ---
20
 
21
  ![image/png](https://cdn-uploads.huggingface.co/production/uploads/64137e2150358a805203cbac/wEaKoLeJzidUdTWwQmA6k.png)
 
1
  ---
 
 
2
  license: cc-by-4.0
3
+ library_name: transformers
4
+ tags:
5
+ - supertrainer2000
6
  datasets:
7
  - euclaise/TinyCoT
8
  - euclaise/mathoverflow-accepted
 
14
  - pszemraj/booksum-short
15
  - euclaise/reddit-instruct
16
  - euclaise/SciCoT
17
+ base_model:
18
+ - euclaise/Memphis-CoT-3B
 
19
  ---
20
 
21
  ![image/png](https://cdn-uploads.huggingface.co/production/uploads/64137e2150358a805203cbac/wEaKoLeJzidUdTWwQmA6k.png)
tokenizer_config.json CHANGED
@@ -203,6 +203,7 @@
203
  }
204
  },
205
  "bos_token": "<|endoftext|>",
 
206
  "clean_up_tokenization_spaces": true,
207
  "eos_token": "<|endoftext|>",
208
  "model_max_length": 1000000000000000019884624838656,
 
203
  }
204
  },
205
  "bos_token": "<|endoftext|>",
206
+ "chat_template": "{{ '### User:\n' }}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in messages %}{% if message['role'] == 'user' %}{{ message['content'].strip() + '\n' }}{% if add_generation_prompt %}{{ '### Assistant:\n' }}{% endif %}{% elif message['role'] == 'assistant' %}{{ '### Assistant:\n' + message['content'].strip() + '\n### User:\n' }}{% endif %}{% endfor %}",
207
  "clean_up_tokenization_spaces": true,
208
  "eos_token": "<|endoftext|>",
209
  "model_max_length": 1000000000000000019884624838656,