quanIta_t5 / cfg.json
Davide Montebovi
first version
4455348
raw
history blame contribute delete
802 Bytes
{
  "model_name_or_path": "gsarti/it5-base",
  "tokenizer_name": "gsarti/it5-base",
  "dataset_name": "/content/drive/MyDrive/_colab/squad_code/my_squad_it",
  "do_train": true,
  "do_eval": false,
  "push_to_hub": false,
  "per_device_train_batch_size": 3,
  "per_device_eval_batch_size": 3,
  "learning_rate": 3e-5,
  "num_train_epochs": 3,
  "max_seq_length": 384,
  "doc_stride": 128,
  "max_answer_length": 30,
  "n_best_size": 5,
  "save_steps": 500000,
  "save_total_limit": 3,
  "save_strategy": "steps",
  "context_column": "context",
  "question_column": "question",
  "answer_column": "answers",
  "output_dir": "./tmp/quanIta3-t5/",
  "version_2_with_negative": true,
  "eval_steps": 2000,
  "evaluation_strategy": "steps",
  "predict_with_generate": true,
  "max_eval_samples": 1000
}