hippopotam committed on
Commit
c98b088
1 Parent(s): e9165d4

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +14 -0
  2. eval_results.json +9 -0
  3. train_results.json +8 -0
  4. trainer_state.json +127 -0
all_results.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 19.82,
3
+ "eval_loss": 0.5335429310798645,
4
+ "eval_runtime": 100.4145,
5
+ "eval_samples": 1647,
6
+ "eval_samples_per_second": 16.402,
7
+ "eval_steps_per_second": 1.026,
8
+ "eval_wer": 0.493922990501481,
9
+ "train_loss": 1.770811665499652,
10
+ "train_runtime": 22430.6801,
11
+ "train_samples": 3478,
12
+ "train_samples_per_second": 3.101,
13
+ "train_steps_per_second": 0.048
14
+ }
eval_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 19.82,
3
+ "eval_loss": 0.5335429310798645,
4
+ "eval_runtime": 100.4145,
5
+ "eval_samples": 1647,
6
+ "eval_samples_per_second": 16.402,
7
+ "eval_steps_per_second": 1.026,
8
+ "eval_wer": 0.493922990501481
9
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 19.82,
3
+ "train_loss": 1.770811665499652,
4
+ "train_runtime": 22430.6801,
5
+ "train_samples": 3478,
6
+ "train_samples_per_second": 3.101,
7
+ "train_steps_per_second": 0.048
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,127 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 19.81651376146789,
5
+ "global_step": 1080,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.83,
12
+ "eval_loss": 4.108390808105469,
13
+ "eval_runtime": 103.6273,
14
+ "eval_samples_per_second": 15.893,
15
+ "eval_steps_per_second": 0.994,
16
+ "eval_wer": 1.0,
17
+ "step": 100
18
+ },
19
+ {
20
+ "epoch": 3.67,
21
+ "eval_loss": 3.1519322395324707,
22
+ "eval_runtime": 103.1635,
23
+ "eval_samples_per_second": 15.965,
24
+ "eval_steps_per_second": 0.998,
25
+ "eval_wer": 1.0,
26
+ "step": 200
27
+ },
28
+ {
29
+ "epoch": 5.5,
30
+ "eval_loss": 1.9347835779190063,
31
+ "eval_runtime": 102.3063,
32
+ "eval_samples_per_second": 16.099,
33
+ "eval_steps_per_second": 1.007,
34
+ "eval_wer": 0.9798794811561639,
35
+ "step": 300
36
+ },
37
+ {
38
+ "epoch": 7.34,
39
+ "eval_loss": 0.7185050249099731,
40
+ "eval_runtime": 102.0354,
41
+ "eval_samples_per_second": 16.141,
42
+ "eval_steps_per_second": 1.009,
43
+ "eval_wer": 0.74895312021244,
44
+ "step": 400
45
+ },
46
+ {
47
+ "epoch": 9.17,
48
+ "learning_rate": 0.0001996,
49
+ "loss": 3.6165,
50
+ "step": 500
51
+ },
52
+ {
53
+ "epoch": 9.17,
54
+ "eval_loss": 0.6041333079338074,
55
+ "eval_runtime": 101.7041,
56
+ "eval_samples_per_second": 16.194,
57
+ "eval_steps_per_second": 1.013,
58
+ "eval_wer": 0.636809314676744,
59
+ "step": 500
60
+ },
61
+ {
62
+ "epoch": 11.01,
63
+ "eval_loss": 0.5609970092773438,
64
+ "eval_runtime": 102.5678,
65
+ "eval_samples_per_second": 16.058,
66
+ "eval_steps_per_second": 1.004,
67
+ "eval_wer": 0.5770605658257584,
68
+ "step": 600
69
+ },
70
+ {
71
+ "epoch": 12.84,
72
+ "eval_loss": 0.5291760563850403,
73
+ "eval_runtime": 101.4306,
74
+ "eval_samples_per_second": 16.238,
75
+ "eval_steps_per_second": 1.015,
76
+ "eval_wer": 0.5397814319272801,
77
+ "step": 700
78
+ },
79
+ {
80
+ "epoch": 14.68,
81
+ "eval_loss": 0.5242128968238831,
82
+ "eval_runtime": 100.8318,
83
+ "eval_samples_per_second": 16.334,
84
+ "eval_steps_per_second": 1.022,
85
+ "eval_wer": 0.5083239709937698,
86
+ "step": 800
87
+ },
88
+ {
89
+ "epoch": 16.51,
90
+ "eval_loss": 0.5442604422569275,
91
+ "eval_runtime": 101.3912,
92
+ "eval_samples_per_second": 16.244,
93
+ "eval_steps_per_second": 1.016,
94
+ "eval_wer": 0.5037279133898478,
95
+ "step": 900
96
+ },
97
+ {
98
+ "epoch": 18.35,
99
+ "learning_rate": 2.7931034482758622e-05,
100
+ "loss": 0.1894,
101
+ "step": 1000
102
+ },
103
+ {
104
+ "epoch": 18.35,
105
+ "eval_loss": 0.5313596725463867,
106
+ "eval_runtime": 102.9424,
107
+ "eval_samples_per_second": 15.999,
108
+ "eval_steps_per_second": 1.001,
109
+ "eval_wer": 0.49443366356858337,
110
+ "step": 1000
111
+ },
112
+ {
113
+ "epoch": 19.82,
114
+ "step": 1080,
115
+ "total_flos": 8.773864807508535e+18,
116
+ "train_loss": 1.770811665499652,
117
+ "train_runtime": 22430.6801,
118
+ "train_samples_per_second": 3.101,
119
+ "train_steps_per_second": 0.048
120
+ }
121
+ ],
122
+ "max_steps": 1080,
123
+ "num_train_epochs": 20,
124
+ "total_flos": 8.773864807508535e+18,
125
+ "trial_name": null,
126
+ "trial_params": null
127
+ }