Theoreticallyhugo commited on
Commit
afba4e7
1 Parent(s): 546d30f

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-41/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9123959af3f5dd3fdeb56cccc82654b70d6c266ab2411dfe944fc31d546b1ab9
3
  size 592318676
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dc5d0ba734c8019fa04c361bf322ee1c8bf7931635d51072f2aad24342cdc17
3
  size 592318676
checkpoint-41/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6284a75f91ce26e97a7215befc9d63db452c6cab7685e34c895d01044783a56c
3
  size 1014645498
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14acd6c94a909cef1e34eda727f8339a9ae29cfe4d16e70d3a047ffbe78f753f
3
  size 1014645498
checkpoint-41/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a939982f711c8a91f0893b4f281f0db4fd89d7ca52de2aed82098ef9ff76ea2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b75d0f85c6e5f43bda08f24453a869f5d0b5d0d33d936ef1b542f406f081347
3
  size 14244
checkpoint-41/trainer_state.json CHANGED
@@ -11,39 +11,39 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_B": {
14
- "f1-score": 0.6054590570719602,
15
- "precision": 0.8472222222222222,
16
- "recall": 0.47104247104247104,
17
- "support": 1295.0
18
  },
19
  "eval_I": {
20
- "f1-score": 0.9281628372580799,
21
- "precision": 0.8894522863277146,
22
- "recall": 0.9703962123099925,
23
- "support": 20065.0
24
  },
25
  "eval_O": {
26
- "f1-score": 0.826809241932404,
27
- "precision": 0.8983402489626556,
28
- "recall": 0.7658295012380616,
29
- "support": 8481.0
30
  },
31
- "eval_accuracy": 0.8905867765825543,
32
- "eval_loss": 0.3152744174003601,
33
  "eval_macro avg": {
34
- "f1-score": 0.786810378754148,
35
- "precision": 0.8783382525041974,
36
- "recall": 0.735756061530175,
37
- "support": 29841.0
38
  },
39
- "eval_runtime": 1.3493,
40
- "eval_samples_per_second": 59.291,
41
- "eval_steps_per_second": 7.411,
42
  "eval_weighted avg": {
43
- "f1-score": 0.8853532384745914,
44
- "precision": 0.8901456571293072,
45
- "recall": 0.8905867765825543,
46
- "support": 29841.0
47
  },
48
  "step": 41
49
  }
@@ -53,7 +53,7 @@
53
  "num_input_tokens_seen": 0,
54
  "num_train_epochs": 16,
55
  "save_steps": 500,
56
- "total_flos": 143786652735600.0,
57
  "train_batch_size": 8,
58
  "trial_name": null,
59
  "trial_params": null
 
11
  {
12
  "epoch": 1.0,
13
  "eval_B": {
14
+ "f1-score": 0.6659475008989573,
15
+ "precision": 0.6905294556301268,
16
+ "recall": 0.6430555555555556,
17
+ "support": 1440.0
18
  },
19
  "eval_I": {
20
+ "f1-score": 0.9167863956473609,
21
+ "precision": 0.9325347388596071,
22
+ "recall": 0.9015611247510076,
23
+ "support": 21587.0
24
  },
25
  "eval_O": {
26
+ "f1-score": 0.8443157797996509,
27
+ "precision": 0.8138010452653025,
28
+ "recall": 0.8772080588179128,
29
+ "support": 10473.0
30
  },
31
+ "eval_accuracy": 0.8828358208955224,
32
+ "eval_loss": 0.31183817982673645,
33
  "eval_macro avg": {
34
+ "f1-score": 0.8090165587819897,
35
+ "precision": 0.8122884132516788,
36
+ "recall": 0.8072749130414919,
37
+ "support": 33500.0
38
  },
39
+ "eval_runtime": 1.3725,
40
+ "eval_samples_per_second": 59.018,
41
+ "eval_steps_per_second": 8.015,
42
  "eval_weighted avg": {
43
+ "f1-score": 0.8833478055515172,
44
+ "precision": 0.8850127812218876,
45
+ "recall": 0.8828358208955224,
46
+ "support": 33500.0
47
  },
48
  "step": 41
49
  }
 
53
  "num_input_tokens_seen": 0,
54
  "num_train_epochs": 16,
55
  "save_steps": 500,
56
+ "total_flos": 143340110335800.0,
57
  "train_batch_size": 8,
58
  "trial_name": null,
59
  "trial_params": null
checkpoint-41/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfd4286d28d76d8e118be26c28e11f81993aa41382921ccbb13e9cdeb7b58cf4
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9afc9010526d77714317ce08b144ea519027c2bf7e4a39f3188a1467d7fdf528
3
  size 4664