zubairsalman7 committed on
Commit
92741e5
·
verified ·
1 Parent(s): dd8a334

End of training

Browse files
README.md CHANGED
@@ -3,6 +3,9 @@ library_name: transformers
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
 
 
 
6
  - generated_from_trainer
7
  metrics:
8
  - accuracy
@@ -16,10 +19,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # vit-xray-tumor
18
 
19
- This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.2761
22
- - Accuracy: 0.9595
23
 
24
  ## Model description
25
 
 
3
  license: apache-2.0
4
  base_model: google/vit-base-patch16-224-in21k
5
  tags:
6
+ - medical-imaging
7
+ - chest-xray
8
+ - tumor-detection
9
  - generated_from_trainer
10
  metrics:
11
  - accuracy
 
19
 
20
  # vit-xray-tumor
21
 
22
+ This model is a fine-tuned version of [google/vit-base-patch16-224-in21k](https://huggingface.co/google/vit-base-patch16-224-in21k) on the chest-xray-tumor dataset.
23
  It achieves the following results on the evaluation set:
24
+ - Loss: 0.2989
25
+ - Accuracy: 0.9574
26
 
27
  ## Model description
28
 
all_results.json CHANGED
@@ -1,13 +1,13 @@
1
  {
2
  "epoch": 20.0,
3
  "eval_accuracy": 0.9573894282632147,
4
- "eval_loss": 0.304302453994751,
5
- "eval_runtime": 3.0558,
6
- "eval_samples_per_second": 606.721,
7
- "eval_steps_per_second": 2.618,
8
  "total_flos": 1.3409213882909e+19,
9
- "train_loss": 0.49313004542799554,
10
- "train_runtime": 263.7994,
11
- "train_samples_per_second": 655.953,
12
- "train_steps_per_second": 2.578
13
  }
 
1
  {
2
  "epoch": 20.0,
3
  "eval_accuracy": 0.9573894282632147,
4
+ "eval_loss": 0.2989387512207031,
5
+ "eval_runtime": 3.1028,
6
+ "eval_samples_per_second": 597.518,
7
+ "eval_steps_per_second": 2.578,
8
  "total_flos": 1.3409213882909e+19,
9
+ "train_loss": 0.5017087179071763,
10
+ "train_runtime": 256.3708,
11
+ "train_samples_per_second": 674.96,
12
+ "train_steps_per_second": 2.652
13
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "eval_accuracy": 0.9573894282632147,
4
- "eval_loss": 0.304302453994751,
5
- "eval_runtime": 3.0558,
6
- "eval_samples_per_second": 606.721,
7
- "eval_steps_per_second": 2.618
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "eval_accuracy": 0.9573894282632147,
4
+ "eval_loss": 0.2989387512207031,
5
+ "eval_runtime": 3.1028,
6
+ "eval_samples_per_second": 597.518,
7
+ "eval_steps_per_second": 2.578
8
  }
runs/Dec04_19-59-41_a5f419f997b4/events.out.tfevents.1733342662.a5f419f997b4.7191.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88bf6900aab1315fc7d5c90ed6069adc4568f2dbe9bec50e08b62ce29233f0c9
3
+ size 411
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 20.0,
3
  "total_flos": 1.3409213882909e+19,
4
- "train_loss": 0.49313004542799554,
5
- "train_runtime": 263.7994,
6
- "train_samples_per_second": 655.953,
7
- "train_steps_per_second": 2.578
8
  }
 
1
  {
2
  "epoch": 20.0,
3
  "total_flos": 1.3409213882909e+19,
4
+ "train_loss": 0.5017087179071763,
5
+ "train_runtime": 256.3708,
6
+ "train_samples_per_second": 674.96,
7
+ "train_steps_per_second": 2.652
8
  }
trainer_state.json CHANGED
@@ -10,246 +10,246 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.7352941176470589,
13
- "grad_norm": 0.38581621646881104,
14
  "learning_rate": 2.5e-06,
15
- "loss": 0.6951,
16
  "step": 25
17
  },
18
  {
19
  "epoch": 1.4705882352941178,
20
- "grad_norm": 0.5082659721374512,
21
  "learning_rate": 5e-06,
22
- "loss": 0.6485,
23
  "step": 50
24
  },
25
  {
26
  "epoch": 2.2058823529411766,
27
- "grad_norm": 0.2886718809604645,
28
  "learning_rate": 7.500000000000001e-06,
29
- "loss": 0.5551,
30
  "step": 75
31
  },
32
  {
33
  "epoch": 2.9411764705882355,
34
- "grad_norm": 0.3792360723018646,
35
  "learning_rate": 1e-05,
36
- "loss": 0.5264,
37
  "step": 100
38
  },
39
  {
40
  "epoch": 3.6764705882352944,
41
- "grad_norm": 0.3348362445831299,
42
  "learning_rate": 9.954227982894034e-06,
43
- "loss": 0.5275,
44
  "step": 125
45
  },
46
  {
47
  "epoch": 3.6764705882352944,
48
  "eval_accuracy": 0.9606256742179072,
49
- "eval_loss": 0.29926320910453796,
50
- "eval_runtime": 3.4401,
51
- "eval_samples_per_second": 538.942,
52
- "eval_steps_per_second": 2.326,
53
  "step": 125
54
  },
55
  {
56
  "epoch": 4.411764705882353,
57
- "grad_norm": 0.30328646302223206,
58
  "learning_rate": 9.817749962596115e-06,
59
- "loss": 0.5174,
60
  "step": 150
61
  },
62
  {
63
  "epoch": 5.147058823529412,
64
- "grad_norm": 0.28701943159103394,
65
  "learning_rate": 9.59306468881811e-06,
66
- "loss": 0.5126,
67
  "step": 175
68
  },
69
  {
70
  "epoch": 5.882352941176471,
71
- "grad_norm": 0.4482644498348236,
72
  "learning_rate": 9.284285880837947e-06,
73
- "loss": 0.5135,
74
  "step": 200
75
  },
76
  {
77
  "epoch": 6.617647058823529,
78
- "grad_norm": 0.4473366141319275,
79
  "learning_rate": 8.897066910207958e-06,
80
- "loss": 0.5019,
81
  "step": 225
82
  },
83
  {
84
  "epoch": 7.352941176470588,
85
- "grad_norm": 0.7015063166618347,
86
  "learning_rate": 8.438497294267117e-06,
87
- "loss": 0.5129,
88
  "step": 250
89
  },
90
  {
91
  "epoch": 7.352941176470588,
92
- "eval_accuracy": 0.9606256742179072,
93
- "eval_loss": 0.28240302205085754,
94
- "eval_runtime": 3.4557,
95
- "eval_samples_per_second": 536.501,
96
- "eval_steps_per_second": 2.315,
97
  "step": 250
98
  },
99
  {
100
  "epoch": 8.088235294117647,
101
- "grad_norm": 0.6289227604866028,
102
  "learning_rate": 7.916972895537471e-06,
103
- "loss": 0.5036,
104
  "step": 275
105
  },
106
  {
107
  "epoch": 8.823529411764707,
108
- "grad_norm": 0.5625348091125488,
109
  "learning_rate": 7.342042203498952e-06,
110
- "loss": 0.4982,
111
  "step": 300
112
  },
113
  {
114
  "epoch": 9.558823529411764,
115
- "grad_norm": 0.5729047656059265,
116
  "learning_rate": 6.724231513139853e-06,
117
- "loss": 0.5002,
118
  "step": 325
119
  },
120
  {
121
  "epoch": 10.294117647058824,
122
- "grad_norm": 0.584720253944397,
123
  "learning_rate": 6.074852201055121e-06,
124
- "loss": 0.4852,
125
  "step": 350
126
  },
127
  {
128
  "epoch": 11.029411764705882,
129
- "grad_norm": 0.7636251449584961,
130
  "learning_rate": 5.405793627637157e-06,
131
- "loss": 0.4798,
132
  "step": 375
133
  },
134
  {
135
  "epoch": 11.029411764705882,
136
- "eval_accuracy": 0.9606256742179072,
137
- "eval_loss": 0.2859905958175659,
138
- "eval_runtime": 3.4319,
139
- "eval_samples_per_second": 540.227,
140
- "eval_steps_per_second": 2.331,
141
  "step": 375
142
  },
143
  {
144
  "epoch": 11.764705882352942,
145
- "grad_norm": 0.8783677220344543,
146
  "learning_rate": 4.729305457072913e-06,
147
- "loss": 0.4716,
148
  "step": 400
149
  },
150
  {
151
  "epoch": 12.5,
152
- "grad_norm": 0.9321892261505127,
153
  "learning_rate": 4.057773380608411e-06,
154
- "loss": 0.4717,
155
  "step": 425
156
  },
157
  {
158
  "epoch": 13.235294117647058,
159
- "grad_norm": 0.9250620603561401,
160
  "learning_rate": 3.403492349320101e-06,
161
- "loss": 0.4582,
162
  "step": 450
163
  },
164
  {
165
  "epoch": 13.970588235294118,
166
- "grad_norm": 0.8018546104431152,
167
  "learning_rate": 2.778441468230483e-06,
168
- "loss": 0.4522,
169
  "step": 475
170
  },
171
  {
172
  "epoch": 14.705882352941176,
173
- "grad_norm": 1.0216737985610962,
174
  "learning_rate": 2.1940646731880887e-06,
175
- "loss": 0.447,
176
  "step": 500
177
  },
178
  {
179
  "epoch": 14.705882352941176,
180
- "eval_accuracy": 0.9606256742179072,
181
- "eval_loss": 0.27990368008613586,
182
- "eval_runtime": 3.4455,
183
- "eval_samples_per_second": 538.087,
184
- "eval_steps_per_second": 2.322,
185
  "step": 500
186
  },
187
  {
188
  "epoch": 15.441176470588236,
189
- "grad_norm": 1.5922119617462158,
190
  "learning_rate": 1.6610612060565235e-06,
191
- "loss": 0.4376,
192
  "step": 525
193
  },
194
  {
195
  "epoch": 16.176470588235293,
196
- "grad_norm": 0.8803838491439819,
197
  "learning_rate": 1.1891897243618184e-06,
198
- "loss": 0.446,
199
  "step": 550
200
  },
201
  {
202
  "epoch": 16.91176470588235,
203
- "grad_norm": 1.0972355604171753,
204
  "learning_rate": 7.870896319167548e-07,
205
- "loss": 0.4368,
206
  "step": 575
207
  },
208
  {
209
  "epoch": 17.647058823529413,
210
- "grad_norm": 1.1943304538726807,
211
  "learning_rate": 4.6212290164521554e-07,
212
- "loss": 0.4321,
213
  "step": 600
214
  },
215
  {
216
  "epoch": 18.38235294117647,
217
- "grad_norm": 0.9729615449905396,
218
  "learning_rate": 2.2023928664194229e-07,
219
- "loss": 0.4283,
220
  "step": 625
221
  },
222
  {
223
  "epoch": 18.38235294117647,
224
- "eval_accuracy": 0.9606256742179072,
225
- "eval_loss": 0.2707391679286957,
226
- "eval_runtime": 3.4368,
227
- "eval_samples_per_second": 539.461,
228
- "eval_steps_per_second": 2.328,
229
  "step": 625
230
  },
231
  {
232
  "epoch": 19.11764705882353,
233
- "grad_norm": 1.2270188331604004,
234
  "learning_rate": 6.58673872923693e-08,
235
- "loss": 0.4379,
236
  "step": 650
237
  },
238
  {
239
  "epoch": 19.852941176470587,
240
- "grad_norm": 0.9648692011833191,
241
  "learning_rate": 1.8335688835802169e-09,
242
- "loss": 0.4281,
243
  "step": 675
244
  },
245
  {
246
  "epoch": 20.0,
247
  "step": 680,
248
  "total_flos": 1.3409213882909e+19,
249
- "train_loss": 0.49313004542799554,
250
- "train_runtime": 263.7994,
251
- "train_samples_per_second": 655.953,
252
- "train_steps_per_second": 2.578
253
  }
254
  ],
255
  "logging_steps": 25,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.7352941176470589,
13
+ "grad_norm": 0.32342442870140076,
14
  "learning_rate": 2.5e-06,
15
+ "loss": 0.7033,
16
  "step": 25
17
  },
18
  {
19
  "epoch": 1.4705882352941178,
20
+ "grad_norm": 0.5360887050628662,
21
  "learning_rate": 5e-06,
22
+ "loss": 0.6638,
23
  "step": 50
24
  },
25
  {
26
  "epoch": 2.2058823529411766,
27
+ "grad_norm": 0.32269367575645447,
28
  "learning_rate": 7.500000000000001e-06,
29
+ "loss": 0.5639,
30
  "step": 75
31
  },
32
  {
33
  "epoch": 2.9411764705882355,
34
+ "grad_norm": 0.3643856644630432,
35
  "learning_rate": 1e-05,
36
+ "loss": 0.5276,
37
  "step": 100
38
  },
39
  {
40
  "epoch": 3.6764705882352944,
41
+ "grad_norm": 0.3383520543575287,
42
  "learning_rate": 9.954227982894034e-06,
43
+ "loss": 0.5283,
44
  "step": 125
45
  },
46
  {
47
  "epoch": 3.6764705882352944,
48
  "eval_accuracy": 0.9606256742179072,
49
+ "eval_loss": 0.29475122690200806,
50
+ "eval_runtime": 3.6867,
51
+ "eval_samples_per_second": 502.885,
52
+ "eval_steps_per_second": 2.17,
53
  "step": 125
54
  },
55
  {
56
  "epoch": 4.411764705882353,
57
+ "grad_norm": 0.3172575831413269,
58
  "learning_rate": 9.817749962596115e-06,
59
+ "loss": 0.5181,
60
  "step": 150
61
  },
62
  {
63
  "epoch": 5.147058823529412,
64
+ "grad_norm": 0.2688044309616089,
65
  "learning_rate": 9.59306468881811e-06,
66
+ "loss": 0.5133,
67
  "step": 175
68
  },
69
  {
70
  "epoch": 5.882352941176471,
71
+ "grad_norm": 0.47131991386413574,
72
  "learning_rate": 9.284285880837947e-06,
73
+ "loss": 0.5142,
74
  "step": 200
75
  },
76
  {
77
  "epoch": 6.617647058823529,
78
+ "grad_norm": 0.437072217464447,
79
  "learning_rate": 8.897066910207958e-06,
80
+ "loss": 0.5043,
81
  "step": 225
82
  },
83
  {
84
  "epoch": 7.352941176470588,
85
+ "grad_norm": 0.9283384084701538,
86
  "learning_rate": 8.438497294267117e-06,
87
+ "loss": 0.516,
88
  "step": 250
89
  },
90
  {
91
  "epoch": 7.352941176470588,
92
+ "eval_accuracy": 0.9600862998921251,
93
+ "eval_loss": 0.28430742025375366,
94
+ "eval_runtime": 3.3555,
95
+ "eval_samples_per_second": 552.534,
96
+ "eval_steps_per_second": 2.384,
97
  "step": 250
98
  },
99
  {
100
  "epoch": 8.088235294117647,
101
+ "grad_norm": 0.4921472370624542,
102
  "learning_rate": 7.916972895537471e-06,
103
+ "loss": 0.5053,
104
  "step": 275
105
  },
106
  {
107
  "epoch": 8.823529411764707,
108
+ "grad_norm": 0.6513373851776123,
109
  "learning_rate": 7.342042203498952e-06,
110
+ "loss": 0.5023,
111
  "step": 300
112
  },
113
  {
114
  "epoch": 9.558823529411764,
115
+ "grad_norm": 0.5955798625946045,
116
  "learning_rate": 6.724231513139853e-06,
117
+ "loss": 0.5046,
118
  "step": 325
119
  },
120
  {
121
  "epoch": 10.294117647058824,
122
+ "grad_norm": 0.5370674729347229,
123
  "learning_rate": 6.074852201055121e-06,
124
+ "loss": 0.4918,
125
  "step": 350
126
  },
127
  {
128
  "epoch": 11.029411764705882,
129
+ "grad_norm": 0.6328652501106262,
130
  "learning_rate": 5.405793627637157e-06,
131
+ "loss": 0.4878,
132
  "step": 375
133
  },
134
  {
135
  "epoch": 11.029411764705882,
136
+ "eval_accuracy": 0.9600862998921251,
137
+ "eval_loss": 0.275637149810791,
138
+ "eval_runtime": 3.4137,
139
+ "eval_samples_per_second": 543.107,
140
+ "eval_steps_per_second": 2.344,
141
  "step": 375
142
  },
143
  {
144
  "epoch": 11.764705882352942,
145
+ "grad_norm": 1.029469609260559,
146
  "learning_rate": 4.729305457072913e-06,
147
+ "loss": 0.4806,
148
  "step": 400
149
  },
150
  {
151
  "epoch": 12.5,
152
+ "grad_norm": 0.7929940223693848,
153
  "learning_rate": 4.057773380608411e-06,
154
+ "loss": 0.4819,
155
  "step": 425
156
  },
157
  {
158
  "epoch": 13.235294117647058,
159
+ "grad_norm": 0.8358489871025085,
160
  "learning_rate": 3.403492349320101e-06,
161
+ "loss": 0.4693,
162
  "step": 450
163
  },
164
  {
165
  "epoch": 13.970588235294118,
166
+ "grad_norm": 1.030651569366455,
167
  "learning_rate": 2.778441468230483e-06,
168
+ "loss": 0.4632,
169
  "step": 475
170
  },
171
  {
172
  "epoch": 14.705882352941176,
173
+ "grad_norm": 1.082851529121399,
174
  "learning_rate": 2.1940646731880887e-06,
175
+ "loss": 0.459,
176
  "step": 500
177
  },
178
  {
179
  "epoch": 14.705882352941176,
180
+ "eval_accuracy": 0.9600862998921251,
181
+ "eval_loss": 0.2800777554512024,
182
+ "eval_runtime": 3.4811,
183
+ "eval_samples_per_second": 532.584,
184
+ "eval_steps_per_second": 2.298,
185
  "step": 500
186
  },
187
  {
188
  "epoch": 15.441176470588236,
189
+ "grad_norm": 0.9598743319511414,
190
  "learning_rate": 1.6610612060565235e-06,
191
+ "loss": 0.4518,
192
  "step": 525
193
  },
194
  {
195
  "epoch": 16.176470588235293,
196
+ "grad_norm": 0.8586243987083435,
197
  "learning_rate": 1.1891897243618184e-06,
198
+ "loss": 0.4604,
199
  "step": 550
200
  },
201
  {
202
  "epoch": 16.91176470588235,
203
+ "grad_norm": 1.1040153503417969,
204
  "learning_rate": 7.870896319167548e-07,
205
+ "loss": 0.4542,
206
  "step": 575
207
  },
208
  {
209
  "epoch": 17.647058823529413,
210
+ "grad_norm": 0.8632078766822815,
211
  "learning_rate": 4.6212290164521554e-07,
212
+ "loss": 0.4473,
213
  "step": 600
214
  },
215
  {
216
  "epoch": 18.38235294117647,
217
+ "grad_norm": 0.9933310151100159,
218
  "learning_rate": 2.2023928664194229e-07,
219
+ "loss": 0.4462,
220
  "step": 625
221
  },
222
  {
223
  "epoch": 18.38235294117647,
224
+ "eval_accuracy": 0.959546925566343,
225
+ "eval_loss": 0.2760601043701172,
226
+ "eval_runtime": 3.319,
227
+ "eval_samples_per_second": 558.602,
228
+ "eval_steps_per_second": 2.41,
229
  "step": 625
230
  },
231
  {
232
  "epoch": 19.11764705882353,
233
+ "grad_norm": 0.9852302074432373,
234
  "learning_rate": 6.58673872923693e-08,
235
+ "loss": 0.4523,
236
  "step": 650
237
  },
238
  {
239
  "epoch": 19.852941176470587,
240
+ "grad_norm": 0.8414192795753479,
241
  "learning_rate": 1.8335688835802169e-09,
242
+ "loss": 0.4441,
243
  "step": 675
244
  },
245
  {
246
  "epoch": 20.0,
247
  "step": 680,
248
  "total_flos": 1.3409213882909e+19,
249
+ "train_loss": 0.5017087179071763,
250
+ "train_runtime": 256.3708,
251
+ "train_samples_per_second": 674.96,
252
+ "train_steps_per_second": 2.652
253
  }
254
  ],
255
  "logging_steps": 25,