File size: 2,512 Bytes
715422c
 
 
19a3c5e
 
715422c
 
 
 
 
19a3c5e
711bff1
19a3c5e
711bff1
8135567
 
19a3c5e
 
 
 
 
 
711bff1
8135567
 
19a3c5e
 
 
711bff1
8135567
 
19a3c5e
 
 
 
 
 
711bff1
8135567
 
19a3c5e
 
 
711bff1
8135567
 
19a3c5e
 
 
 
 
 
711bff1
8135567
 
19a3c5e
 
 
711bff1
715422c
 
19a3c5e
 
 
 
 
 
711bff1
715422c
 
19a3c5e
 
 
711bff1
8135567
 
19a3c5e
 
 
 
 
 
711bff1
8135567
 
19a3c5e
 
 
711bff1
8135567
 
19a3c5e
 
 
 
 
 
711bff1
715422c
 
19a3c5e
711bff1
19a3c5e
715422c
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 7.407407407407407,
  "global_step": 600,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.23,
      "learning_rate": 0.0001,
      "loss": 0.0625,
      "step": 100
    },
    {
      "epoch": 1.23,
      "eval_loss": 0.28051668405532837,
      "eval_runtime": 198.6071,
      "eval_samples_per_second": 16.374,
      "eval_steps_per_second": 2.049,
      "eval_wer": 0.2381097005406062,
      "step": 100
    },
    {
      "epoch": 2.47,
      "learning_rate": 9.987639060568604e-05,
      "loss": 0.047,
      "step": 200
    },
    {
      "epoch": 2.47,
      "eval_loss": 0.34423157572746277,
      "eval_runtime": 147.7154,
      "eval_samples_per_second": 22.015,
      "eval_steps_per_second": 2.755,
      "eval_wer": 0.2334325457085586,
      "step": 200
    },
    {
      "epoch": 3.7,
      "learning_rate": 9.975278121137207e-05,
      "loss": 0.0409,
      "step": 300
    },
    {
      "epoch": 3.7,
      "eval_loss": 0.3597787916660309,
      "eval_runtime": 156.092,
      "eval_samples_per_second": 20.834,
      "eval_steps_per_second": 2.607,
      "eval_wer": 0.23124582396889995,
      "step": 300
    },
    {
      "epoch": 4.94,
      "learning_rate": 9.96291718170581e-05,
      "loss": 0.0413,
      "step": 400
    },
    {
      "epoch": 4.94,
      "eval_loss": 0.35860675573349,
      "eval_runtime": 151.5312,
      "eval_samples_per_second": 21.461,
      "eval_steps_per_second": 2.686,
      "eval_wer": 0.2421794326671931,
      "step": 400
    },
    {
      "epoch": 6.17,
      "learning_rate": 9.950556242274414e-05,
      "loss": 0.0388,
      "step": 500
    },
    {
      "epoch": 6.17,
      "eval_loss": 0.3748931586742401,
      "eval_runtime": 154.1563,
      "eval_samples_per_second": 21.095,
      "eval_steps_per_second": 2.64,
      "eval_wer": 0.23914231913988945,
      "step": 500
    },
    {
      "epoch": 7.41,
      "learning_rate": 9.938195302843017e-05,
      "loss": 0.0383,
      "step": 600
    },
    {
      "epoch": 7.41,
      "eval_loss": 0.36109668016433716,
      "eval_runtime": 163.2656,
      "eval_samples_per_second": 19.918,
      "eval_steps_per_second": 2.493,
      "eval_wer": 0.2352548138249408,
      "step": 600
    }
  ],
  "max_steps": 81000,
  "num_train_epochs": 1000,
  "total_flos": 1.9144703855961313e+19,
  "trial_name": null,
  "trial_params": null
}