voidful commited on
Commit
ab4250c
1 Parent(s): 28a908d

update model and readme

Browse files
Files changed (4) hide show
  1. README.md +39 -0
  2. config.json +4 -5
  3. pytorch_model.bin +2 -2
  4. tokenizer_config.json +1 -1
README.md ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language: en
3
+ tags:
4
+ - bart
5
+ - distractor
6
+ - generation
7
+ - seq2seq
8
+ datasets:
9
+ - race
10
+ metrics:
11
+ - bleu
12
+ - rouge
13
+ pipeline_tag: text2text-generation
14
+ widget:
15
+ - text: "When you ' re having a holiday , one of the main questions to ask is which hotel or apartment to choose . However , when it comes to France , you have another special choice : treehouses . In France , treehouses are offered to travelers as a new choice in many places . The price may be a little higher , but you do have a chance to _ your childhood memories . Alain Laurens , one of France ' s top treehouse designers , said , ' Most of the people might have the experience of building a den when they were young . And they like that feeling of freedom when they are children . ' Its fairy - tale style gives travelers a special feeling . It seems as if they are living as a forest king and enjoying the fresh air in the morning . Another kind of treehouse is the ' star cube ' . It gives travelers the chance of looking at the stars shining in the sky when they are going to sleep . Each ' star cube ' not only offers all the comfortable things that a hotel provides for travelers , but also gives them a chance to look for stars by using a telescope . The glass roof allows you to look at the stars from your bed . </s> The passage mainly tells us </s> treehouses in france."
16
+ ---
17
+ # bart-distractor-generation-pm
18
+
19
+ ## Model description
20
+
21
+ This model is a sequence-to-sequence distractor generator which takes an answer, question and context as input, and generates a distractor as output. It is based on a pretrained `bart-base` model.
22
+ This model was trained with Parallel MLM; refer to the [Paper](https://www.aclweb.org/anthology/2020.findings-emnlp.393/).
23
+ For details, please see https://github.com/voidful/BDG.
24
+
25
+ ## Intended uses & limitations
26
+
27
+ The model is trained to generate examination-style multiple-choice distractors. The model performs best with full-sentence answers.
28
+
29
+ #### How to use
30
+
31
+ The model takes concatenated context, question and answers as an input sequence, and will generate a full distractor sentence as an output sequence. The max sequence length is 1024 tokens. Inputs should be organised into the following format:
32
+ ```
33
+ context </s> question </s> answer
34
+ ```
35
+ The input sequence can then be encoded and passed as the `input_ids` argument in the model's `generate()` method.
36
+
37
+ #### Limitations and bias
38
+
39
+ The model is limited to generating distractors in the same style as those found in [RACE](https://www.aclweb.org/anthology/D17-1082/). The generated distractors can potentially be leading or reflect biases that are present in the context. If the context is too short or completely absent, or if the context, question and answer do not match, the generated distractor is likely to be incoherent.
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "bart-distractor-generation-both",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
@@ -17,7 +17,6 @@
17
  "decoder_layerdrop": 0.0,
18
  "decoder_layers": 6,
19
  "decoder_start_token_id": 2,
20
- "do_blenderbot_90_layernorm": false,
21
  "dropout": 0.1,
22
  "early_stopping": true,
23
  "encoder_attention_heads": 12,
@@ -25,8 +24,8 @@
25
  "encoder_layerdrop": 0.0,
26
  "encoder_layers": 6,
27
  "eos_token_id": 2,
28
- "extra_pos_embeddings": 2,
29
- "force_bos_token_to_be_generated": false,
30
  "id2label": {
31
  "0": "LABEL_0",
32
  "1": "LABEL_1",
@@ -48,7 +47,6 @@
48
  "num_hidden_layers": 6,
49
  "pad_token_id": 1,
50
  "scale_embedding": false,
51
- "static_position_embeddings": false,
52
  "task_specific_params": {
53
  "summarization": {
54
  "length_penalty": 1.0,
@@ -70,6 +68,7 @@
70
  }
71
  },
72
  "tie_word_embeddings": false,
 
73
  "use_cache": true,
74
  "vocab_size": 50265
75
  }
 
1
  {
2
+ "_name_or_path": "facebook/bart-base",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
 
17
  "decoder_layerdrop": 0.0,
18
  "decoder_layers": 6,
19
  "decoder_start_token_id": 2,
 
20
  "dropout": 0.1,
21
  "early_stopping": true,
22
  "encoder_attention_heads": 12,
 
24
  "encoder_layerdrop": 0.0,
25
  "encoder_layers": 6,
26
  "eos_token_id": 2,
27
+ "forced_eos_token_id": 2,
28
+ "gradient_checkpointing": false,
29
  "id2label": {
30
  "0": "LABEL_0",
31
  "1": "LABEL_1",
 
47
  "num_hidden_layers": 6,
48
  "pad_token_id": 1,
49
  "scale_embedding": false,
 
50
  "task_specific_params": {
51
  "summarization": {
52
  "length_penalty": 1.0,
 
68
  }
69
  },
70
  "tie_word_embeddings": false,
71
+ "transformers_version": "4.4.2",
72
  "use_cache": true,
73
  "vocab_size": 50265
74
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ee0053b528d067d2bcaca0bab4be9b64b180b4a95ba996ebec85b17e2784aa8
3
- size 867013518
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb9f1dce141d2bd6959cbafccddd254db92b3f579040624e90db9fc30d42b3be
3
+ size 712397879
tokenizer_config.json CHANGED
@@ -1 +1 @@
1
- {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 1024, "name_or_path": "facebook/bart-base"}
 
1
+ {"unk_token": "<unk>", "bos_token": "<s>", "eos_token": "</s>", "add_prefix_space": false, "errors": "replace", "sep_token": "</s>", "cls_token": "<s>", "pad_token": "<pad>", "mask_token": "<mask>", "model_max_length": 1024, "special_tokens_map_file": null, "name_or_path": "facebook/bart-base"}