tuanle committed on
Commit
6ca3908
1 Parent(s): 640f858

Training in progress, step 500

Browse files
Files changed (3) hide show
  1. config.json +12 -6
  2. pytorch_model.bin +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,15 +1,21 @@
1
  {
2
- "_name_or_path": "imthanhlv/gpt2news",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
6
  ],
7
- "attn_pdrop": 0.0,
8
  "bos_token_id": 50256,
9
- "embd_pdrop": 0.0,
10
  "eos_token_id": 50256,
11
  "gradient_checkpointing": false,
 
 
 
12
  "initializer_range": 0.02,
 
 
 
13
  "layer_norm_epsilon": 1e-05,
14
  "model_type": "gpt2",
15
  "n_ctx": 1024,
@@ -19,7 +25,7 @@
19
  "n_layer": 12,
20
  "n_positions": 1024,
21
  "reorder_and_upcast_attn": false,
22
- "resid_pdrop": 0.0,
23
  "scale_attn_by_inverse_layer_idx": false,
24
  "scale_attn_weights": true,
25
  "summary_activation": null,
@@ -30,11 +36,11 @@
30
  "task_specific_params": {
31
  "text-generation": {
32
  "do_sample": true,
33
- "max_length": 150
34
  }
35
  },
36
  "torch_dtype": "float32",
37
  "transformers_version": "4.16.2",
38
  "use_cache": true,
39
- "vocab_size": 50259
40
  }
 
1
  {
2
+ "_name_or_path": "danghuy1999/gpt2-viwiki",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
6
  ],
7
+ "attn_pdrop": 0.1,
8
  "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
  "eos_token_id": 50256,
11
  "gradient_checkpointing": false,
12
+ "id2label": {
13
+ "0": "LABEL_0"
14
+ },
15
  "initializer_range": 0.02,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
  "layer_norm_epsilon": 1e-05,
20
  "model_type": "gpt2",
21
  "n_ctx": 1024,
 
25
  "n_layer": 12,
26
  "n_positions": 1024,
27
  "reorder_and_upcast_attn": false,
28
+ "resid_pdrop": 0.1,
29
  "scale_attn_by_inverse_layer_idx": false,
30
  "scale_attn_weights": true,
31
  "summary_activation": null,
 
36
  "task_specific_params": {
37
  "text-generation": {
38
  "do_sample": true,
39
+ "max_length": 50
40
  }
41
  },
42
  "torch_dtype": "float32",
43
  "transformers_version": "4.16.2",
44
  "use_cache": true,
45
+ "vocab_size": 50258
46
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6aa87ac9a8d0352bd848f68c0b448759363578a50f7a7f6d2d637d0537fea59c
3
- size 510409961
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:956d163f87ad360925868ccb723b9ed50d021f73387841469594f881cf54c12b
3
+ size 510406889
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:347eb7d59ce5683875397a53d9f1d0c071861a796b811deec21d5c8426bfb277
3
  size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f28080c501c962dc2785f9d48dc852a05b41e6c7083e7462f202dc0719135023
3
  size 3055