winegarj committed on
Commit
8eeede7
1 Parent(s): dffa754

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -28,6 +28,6 @@
28
  "sinusoidal_pos_embds": false,
29
  "tie_weights_": true,
30
  "torch_dtype": "float32",
31
- "transformers_version": "4.18.0",
32
  "vocab_size": 30522
33
  }
 
28
  "sinusoidal_pos_embds": false,
29
  "tie_weights_": true,
30
  "torch_dtype": "float32",
31
+ "transformers_version": "4.21.1",
32
  "vocab_size": 30522
33
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:974feff4516334983e43bcdc913852e05f059e8443a3bed990da981e50869e2f
3
  size 267854321
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:345a6b33b2e6ccdcc5cf649259394798ab6f654876539e273d7ad4c82007b634
3
  size 267854321
special_tokens_map.json CHANGED
@@ -1 +1,7 @@
1
- {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 512,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
tokenizer_config.json CHANGED
@@ -1 +1,14 @@
1
- {"do_lower_case": true, "unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]", "tokenize_chinese_chars": true, "strip_accents": null, "model_max_length": 512, "special_tokens_map_file": null, "name_or_path": "distilbert-base-uncased", "tokenizer_class": "DistilBertTokenizer"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "do_lower_case": true,
4
+ "mask_token": "[MASK]",
5
+ "model_max_length": 512,
6
+ "name_or_path": "distilbert-base-uncased",
7
+ "pad_token": "[PAD]",
8
+ "sep_token": "[SEP]",
9
+ "special_tokens_map_file": null,
10
+ "strip_accents": null,
11
+ "tokenize_chinese_chars": true,
12
+ "tokenizer_class": "DistilBertTokenizer",
13
+ "unk_token": "[UNK]"
14
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a6c73ff79397337d4abfbf34ed67b8a76a69f4cc73ad3042e288ffc2655e1f3
3
- size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94cd992b131ecbf0f3f4d9d45a5e60a3530d146ec35620fcd3eadc55a734eb17
3
+ size 3375