anton-l HF staff committed on
Commit
ff8617c
1 Parent(s): 1846853

End of training

Browse files
all_results.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_cer": 0.13557177967326875,
4
+ "eval_loss": 0.5598823428153992,
5
+ "eval_runtime": 13.1271,
6
+ "eval_samples_per_second": 49.287,
7
+ "eval_steps_per_second": 6.17,
8
+ "eval_wer": 0.31477832512315274,
9
+ "predict_samples": 647,
10
+ "train_loss": 1.155013433122852,
11
+ "train_runtime": 1766.4943,
12
+ "train_samples": 2550,
13
+ "train_samples_per_second": 43.306,
14
+ "train_steps_per_second": 0.679
15
+ }
config.json CHANGED
@@ -99,7 +99,7 @@
99
  1,
100
  1
101
  ],
102
- "torch_dtype": "float32",
103
  "transformers_version": "4.18.0.dev0",
104
  "use_weighted_layer_sum": false,
105
  "vocab_size": 60,
 
99
  1,
100
  1
101
  ],
102
+ "torch_dtype": "float16",
103
  "transformers_version": "4.18.0.dev0",
104
  "use_weighted_layer_sum": false,
105
  "vocab_size": 60,
predict_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_cer": 0.13557177967326875,
4
+ "eval_loss": 0.5598823428153992,
5
+ "eval_runtime": 13.1271,
6
+ "eval_samples_per_second": 49.287,
7
+ "eval_steps_per_second": 6.17,
8
+ "eval_wer": 0.31477832512315274,
9
+ "predict_samples": 647
10
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac4c92e046036478dab89d42e824431ab1137aadf8469a9d8e88839ef6d85088
3
- size 1262172273
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0b7512897c93bb57be775272565263faf5e6f675275fb059051b66d5466c7005
3
+ size 631171825
runs/Apr28_10-44-54_anton-xtreme-s/events.out.tfevents.1651144619.anton-xtreme-s.31733.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f00af37b65d9acf2f699954ecb493aa06c54c5a0a6cdbabd07a6e4d0394dce7
3
+ size 830
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "train_loss": 1.155013433122852,
4
+ "train_runtime": 1766.4943,
5
+ "train_samples": 2550,
6
+ "train_samples_per_second": 43.306,
7
+ "train_steps_per_second": 0.679
8
+ }
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff