longformer-spans / checkpoint-162 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 2, checkpoint
cf33ead verified
raw
history blame
2.71 kB
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 2.0,
"eval_steps": 500,
"global_step": 162,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_B": {
"f1-score": 0.8266764382557715,
"precision": 0.7866108786610879,
"recall": 0.871042471042471,
"support": 1295.0
},
"eval_I": {
"f1-score": 0.9410658617447671,
"precision": 0.9344077040239768,
"recall": 0.9478195863443808,
"support": 20065.0
},
"eval_O": {
"f1-score": 0.8562443302086484,
"precision": 0.8789421405512788,
"recall": 0.8346893055064262,
"support": 8481.0
},
"eval_accuracy": 0.912335377500754,
"eval_loss": 0.2450982630252838,
"eval_macro avg": {
"f1-score": 0.8746622100697291,
"precision": 0.8666535744121145,
"recall": 0.8845171209644261,
"support": 29841.0
},
"eval_runtime": 4.6269,
"eval_samples_per_second": 17.29,
"eval_steps_per_second": 2.161,
"eval_weighted avg": {
"f1-score": 0.9119949287205363,
"precision": 0.9122301519092053,
"recall": 0.912335377500754,
"support": 29841.0
},
"step": 81
},
{
"epoch": 2.0,
"eval_B": {
"f1-score": 0.8833395452851286,
"precision": 0.8537463976945245,
"recall": 0.915057915057915,
"support": 1295.0
},
"eval_I": {
"f1-score": 0.9549518227873249,
"precision": 0.9516903430183636,
"recall": 0.958235733864939,
"support": 20065.0
},
"eval_O": {
"f1-score": 0.88924750463212,
"precision": 0.9016969696969697,
"recall": 0.877137130055418,
"support": 8481.0
},
"eval_accuracy": 0.9333132267685399,
"eval_loss": 0.20076116919517517,
"eval_macro avg": {
"f1-score": 0.9091796242348579,
"precision": 0.9023779034699526,
"recall": 0.916810259659424,
"support": 29841.0
},
"eval_runtime": 4.6524,
"eval_samples_per_second": 17.195,
"eval_steps_per_second": 2.149,
"eval_weighted avg": {
"f1-score": 0.9331705077630417,
"precision": 0.9332314707173981,
"recall": 0.9333132267685399,
"support": 29841.0
},
"step": 162
}
],
"logging_steps": 500,
"max_steps": 4050,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"total_flos": 287573305471200.0,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}