File size: 1,456 Bytes
a4fc8c1
 
 
31999ff
 
a4fc8c1
 
 
 
78c3b6b
31999ff
 
 
cdbe678
5165428
25af1c0
31999ff
 
 
25af1c0
 
449018b
31999ff
 
 
cdbe678
25af1c0
 
31999ff
 
 
25af1c0
 
 
31999ff
 
 
cdbe678
25af1c0
 
31999ff
 
 
25af1c0
 
 
31999ff
 
 
449018b
 
 
31999ff
 
 
 
 
 
 
a4fc8c1
 
31999ff
5165428
31999ff
a4fc8c1
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 12.087431693989071,
  "global_step": 1100,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.64,
      "learning_rate": 4.999725244532367e-06,
      "loss": 0.0243,
      "step": 150
    },
    {
      "epoch": 3.3,
      "learning_rate": 4.998900978129465e-06,
      "loss": 0.0192,
      "step": 300
    },
    {
      "epoch": 4.94,
      "learning_rate": 4.998076711726564e-06,
      "loss": 0.0175,
      "step": 450
    },
    {
      "epoch": 6.59,
      "learning_rate": 4.997252445323663e-06,
      "loss": 0.0174,
      "step": 600
    },
    {
      "epoch": 8.24,
      "learning_rate": 4.996428178920761e-06,
      "loss": 0.0168,
      "step": 750
    },
    {
      "epoch": 9.89,
      "learning_rate": 4.995609407627212e-06,
      "loss": 0.0175,
      "step": 900
    },
    {
      "epoch": 11.54,
      "learning_rate": 4.994785141224311e-06,
      "loss": 0.0168,
      "step": 1050
    },
    {
      "epoch": 12.09,
      "eval_loss": 0.23020002245903015,
      "eval_runtime": 433.719,
      "eval_samples_per_second": 9.407,
      "eval_steps_per_second": 1.176,
      "eval_wer": 0.16092909535452324,
      "step": 1100
    }
  ],
  "max_steps": 910000,
  "num_train_epochs": 10000,
  "total_flos": 3.930570221142893e+19,
  "trial_name": null,
  "trial_params": null
}