File size: 2,744 Bytes
fed6441
a192b2b
 
fed6441
 
 
 
 
 
 
 
 
 
a192b2b
 
 
 
fed6441
 
a192b2b
 
 
 
fed6441
 
a192b2b
 
 
 
fed6441
a192b2b
 
fed6441
a192b2b
 
 
 
fed6441
a192b2b
 
 
fed6441
a192b2b
 
 
 
fed6441
 
 
 
 
 
a192b2b
 
 
 
fed6441
 
a192b2b
 
 
 
fed6441
 
a192b2b
 
 
 
fed6441
a192b2b
 
fed6441
a192b2b
 
 
 
fed6441
a192b2b
 
 
fed6441
a192b2b
 
 
 
fed6441
 
 
 
 
a192b2b
fed6441
a192b2b
fed6441
c432d27
fed6441
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{
  "best_metric": 0.2252955436706543,
  "best_model_checkpoint": "longformer-spans/checkpoint-162",
  "epoch": 2.0,
  "eval_steps": 500,
  "global_step": 162,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_B": {
        "f1-score": 0.816,
        "precision": 0.7461594732991953,
        "recall": 0.9002647837599294,
        "support": 1133.0
      },
      "eval_I": {
        "f1-score": 0.9321376763813793,
        "precision": 0.9024103768767235,
        "recall": 0.9638902525500463,
        "support": 18333.0
      },
      "eval_O": {
        "f1-score": 0.8560784528570645,
        "precision": 0.931782945736434,
        "recall": 0.7917511147142278,
        "support": 9868.0
      },
      "eval_accuracy": 0.9035249198881844,
      "eval_loss": 0.2619660496711731,
      "eval_macro avg": {
        "f1-score": 0.8680720430794812,
        "precision": 0.860117598637451,
        "recall": 0.8853020503414012,
        "support": 29334.0
      },
      "eval_runtime": 5.5032,
      "eval_samples_per_second": 14.537,
      "eval_steps_per_second": 1.817,
      "eval_weighted avg": {
        "f1-score": 0.9020655278480035,
        "precision": 0.9062562975065145,
        "recall": 0.9035249198881844,
        "support": 29334.0
      },
      "step": 81
    },
    {
      "epoch": 2.0,
      "eval_B": {
        "f1-score": 0.8512256973795435,
        "precision": 0.8167072181670721,
        "recall": 0.8887908208296558,
        "support": 1133.0
      },
      "eval_I": {
        "f1-score": 0.9416781438711729,
        "precision": 0.9152551099212274,
        "recall": 0.9696721758577429,
        "support": 18333.0
      },
      "eval_O": {
        "f1-score": 0.8778173190984578,
        "precision": 0.9380041484212952,
        "recall": 0.8248885285772193,
        "support": 9868.0
      },
      "eval_accuracy": 0.9178427763005387,
      "eval_loss": 0.2252955436706543,
      "eval_macro avg": {
        "f1-score": 0.8902403867830581,
        "precision": 0.8899888255031981,
        "recall": 0.8944505084215394,
        "support": 29334.0
      },
      "eval_runtime": 5.4972,
      "eval_samples_per_second": 14.553,
      "eval_steps_per_second": 1.819,
      "eval_weighted avg": {
        "f1-score": 0.9167016237671239,
        "precision": 0.9191015935430046,
        "recall": 0.9178427763005387,
        "support": 29334.0
      },
      "step": 162
    }
  ],
  "logging_steps": 500,
  "max_steps": 1620,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 20,
  "save_steps": 500,
  "total_flos": 287573305471200.0,
  "train_batch_size": 4,
  "trial_name": null,
  "trial_params": null
}