Priyanship committed on
Commit
ae87643
·
verified ·
1 Parent(s): d807d66

End of training

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model was trained from scratch on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: 1151.3530
20
  - Wer: 1.0
21
  - Cer: 1.0
22
 
 
16
 
17
  This model was trained from scratch on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 1150.0363
20
  - Wer: 1.0
21
  - Cer: 1.0
22
 
all_results.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.0,
3
+ "eval_cer": 1.0,
4
+ "eval_loss": 1150.0362548828125,
5
+ "eval_runtime": 23.9604,
6
+ "eval_samples": 890,
7
+ "eval_samples_per_second": 37.145,
8
+ "eval_steps_per_second": 4.674,
9
+ "eval_wer": 1.0,
10
+ "total_flos": 5.519100286987747e+18,
11
+ "train_loss": 3828.2266203703703,
12
+ "train_runtime": 3861.8113,
13
+ "train_samples": 17267,
14
+ "train_samples_per_second": 89.424,
15
+ "train_steps_per_second": 5.593
16
+ }
eval--in domain_results.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.0,
3
+ "eval_cer": 1.0,
4
+ "eval_loss": 1150.0362548828125,
5
+ "eval_runtime": 23.9604,
6
+ "eval_samples": 890,
7
+ "eval_samples_per_second": 37.145,
8
+ "eval_steps_per_second": 4.674,
9
+ "eval_wer": 1.0
10
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 6.0,
3
+ "total_flos": 5.519100286987747e+18,
4
+ "train_loss": 3828.2266203703703,
5
+ "train_runtime": 3861.8113,
6
+ "train_samples": 17267,
7
+ "train_samples_per_second": 89.424,
8
+ "train_steps_per_second": 5.593
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,153 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 1.0,
3
+ "best_model_checkpoint": "/scratch/elec/puhe/p/palp3/sami_ASR/base_model_output/wav2vec2-base-sami-cont-pt-22k/outputs/shuff_142/ftpseudowr20esp5/checkpoint-1080",
4
+ "epoch": 6.0,
5
+ "eval_steps": 500,
6
+ "global_step": 6480,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "grad_norm": 110.69710540771484,
14
+ "learning_rate": 0.00012337962962962964,
15
+ "loss": 4511.6611,
16
+ "step": 1080
17
+ },
18
+ {
19
+ "epoch": 1.0,
20
+ "eval_cer": 1.0,
21
+ "eval_loss": 1149.935302734375,
22
+ "eval_runtime": 23.6152,
23
+ "eval_samples_per_second": 37.688,
24
+ "eval_steps_per_second": 4.743,
25
+ "eval_wer": 1.0,
26
+ "step": 1080
27
+ },
28
+ {
29
+ "epoch": 2.0,
30
+ "grad_norm": 134.31155395507812,
31
+ "learning_rate": 0.00024837962962962964,
32
+ "loss": 3591.4514,
33
+ "step": 2160
34
+ },
35
+ {
36
+ "epoch": 2.0,
37
+ "eval_cer": 1.0,
38
+ "eval_loss": 1155.4658203125,
39
+ "eval_runtime": 23.3518,
40
+ "eval_samples_per_second": 38.113,
41
+ "eval_steps_per_second": 4.796,
42
+ "eval_wer": 1.0,
43
+ "step": 2160
44
+ },
45
+ {
46
+ "epoch": 3.0,
47
+ "grad_norm": 156.53646850585938,
48
+ "learning_rate": 0.00037337962962962965,
49
+ "loss": 3649.9262,
50
+ "step": 3240
51
+ },
52
+ {
53
+ "epoch": 3.0,
54
+ "eval_cer": 1.0,
55
+ "eval_loss": 1155.608154296875,
56
+ "eval_runtime": 23.3593,
57
+ "eval_samples_per_second": 38.1,
58
+ "eval_steps_per_second": 4.795,
59
+ "eval_wer": 1.0,
60
+ "step": 3240
61
+ },
62
+ {
63
+ "epoch": 4.0,
64
+ "grad_norm": 100.56692504882812,
65
+ "learning_rate": 0.0004982638888888889,
66
+ "loss": 3789.6616,
67
+ "step": 4320
68
+ },
69
+ {
70
+ "epoch": 4.0,
71
+ "eval_cer": 1.0,
72
+ "eval_loss": 1146.7283935546875,
73
+ "eval_runtime": 23.3466,
74
+ "eval_samples_per_second": 38.121,
75
+ "eval_steps_per_second": 4.797,
76
+ "eval_wer": 1.0,
77
+ "step": 4320
78
+ },
79
+ {
80
+ "epoch": 5.0,
81
+ "grad_norm": 103.7132568359375,
82
+ "learning_rate": 0.0004691840277777778,
83
+ "loss": 3752.8502,
84
+ "step": 5400
85
+ },
86
+ {
87
+ "epoch": 5.0,
88
+ "eval_cer": 1.0,
89
+ "eval_loss": 1158.9339599609375,
90
+ "eval_runtime": 26.3666,
91
+ "eval_samples_per_second": 33.755,
92
+ "eval_steps_per_second": 4.248,
93
+ "eval_wer": 1.0,
94
+ "step": 5400
95
+ },
96
+ {
97
+ "epoch": 6.0,
98
+ "grad_norm": 97.61384582519531,
99
+ "learning_rate": 0.0004379340277777778,
100
+ "loss": 3673.8093,
101
+ "step": 6480
102
+ },
103
+ {
104
+ "epoch": 6.0,
105
+ "eval_cer": 1.0,
106
+ "eval_loss": 1151.35302734375,
107
+ "eval_runtime": 25.4193,
108
+ "eval_samples_per_second": 35.013,
109
+ "eval_steps_per_second": 4.406,
110
+ "eval_wer": 1.0,
111
+ "step": 6480
112
+ },
113
+ {
114
+ "epoch": 6.0,
115
+ "step": 6480,
116
+ "total_flos": 5.519100286987747e+18,
117
+ "train_loss": 3828.2266203703703,
118
+ "train_runtime": 3861.8113,
119
+ "train_samples_per_second": 89.424,
120
+ "train_steps_per_second": 5.593
121
+ }
122
+ ],
123
+ "logging_steps": 500,
124
+ "max_steps": 21600,
125
+ "num_input_tokens_seen": 0,
126
+ "num_train_epochs": 20,
127
+ "save_steps": 500,
128
+ "stateful_callbacks": {
129
+ "EarlyStoppingCallback": {
130
+ "args": {
131
+ "early_stopping_patience": 5,
132
+ "early_stopping_threshold": 0.0
133
+ },
134
+ "attributes": {
135
+ "early_stopping_patience_counter": 5
136
+ }
137
+ },
138
+ "TrainerControl": {
139
+ "args": {
140
+ "should_epoch_stop": false,
141
+ "should_evaluate": false,
142
+ "should_log": false,
143
+ "should_save": true,
144
+ "should_training_stop": true
145
+ },
146
+ "attributes": {}
147
+ }
148
+ },
149
+ "total_flos": 5.519100286987747e+18,
150
+ "train_batch_size": 16,
151
+ "trial_name": null,
152
+ "trial_params": null
153
+ }