ahmedALM1221 committed on
Commit
b809a67
·
1 Parent(s): 6b04b91

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -6,8 +6,8 @@
6
  "eval_samples_per_second": 79.633,
7
  "eval_steps_per_second": 4.977,
8
  "total_flos": 4.860822854913491e+18,
9
- "train_loss": 1.0101308201298569,
10
- "train_runtime": 2441.1089,
11
- "train_samples_per_second": 8.647,
12
- "train_steps_per_second": 0.135
13
  }
 
6
  "eval_samples_per_second": 79.633,
7
  "eval_steps_per_second": 4.977,
8
  "total_flos": 4.860822854913491e+18,
9
+ "train_loss": 0.3027138883417303,
10
+ "train_runtime": 956.6189,
11
+ "train_samples_per_second": 22.065,
12
+ "train_steps_per_second": 0.345
13
  }
runs/Jul05_15-01-11_c8d5d7484861/events.out.tfevents.1688574849.c8d5d7484861.2170.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c8f05691efcb2629cddd73085bc3e001f1dda740e0a3d8d17ee5b11298c8921
3
+ size 5772
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 6.0,
3
  "total_flos": 4.860822854913491e+18,
4
- "train_loss": 1.0101308201298569,
5
- "train_runtime": 2441.1089,
6
- "train_samples_per_second": 8.647,
7
- "train_steps_per_second": 0.135
8
  }
 
1
  {
2
  "epoch": 6.0,
3
  "total_flos": 4.860822854913491e+18,
4
+ "train_loss": 0.3027138883417303,
5
+ "train_runtime": 956.6189,
6
+ "train_samples_per_second": 22.065,
7
+ "train_steps_per_second": 0.345
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8795454545454545,
3
  "best_model_checkpoint": "swinv2-large-patch4-window12to16-192to256-22kto1k-ft-finetuned-eurosat-50/checkpoint-330",
4
  "epoch": 6.0,
5
  "global_step": 330,
@@ -10,263 +10,263 @@
10
  {
11
  "epoch": 0.18,
12
  "learning_rate": 6.060606060606061e-07,
13
- "loss": 2.0126,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.36,
18
  "learning_rate": 1.2121212121212122e-06,
19
- "loss": 2.0149,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.55,
24
  "learning_rate": 1.8181818181818183e-06,
25
- "loss": 1.9557,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.73,
30
  "learning_rate": 2.4242424242424244e-06,
31
- "loss": 1.9057,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 0.91,
36
  "learning_rate": 3.0303030303030305e-06,
37
- "loss": 1.8498,
38
  "step": 50
39
  },
40
  {
41
  "epoch": 1.0,
42
- "eval_accuracy": 0.32727272727272727,
43
- "eval_loss": 1.734784483909607,
44
- "eval_runtime": 359.3738,
45
- "eval_samples_per_second": 2.449,
46
- "eval_steps_per_second": 0.153,
47
  "step": 55
48
  },
49
  {
50
  "epoch": 1.09,
51
  "learning_rate": 3.6363636363636366e-06,
52
- "loss": 1.7745,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.27,
57
  "learning_rate": 4.242424242424243e-06,
58
- "loss": 1.7178,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.45,
63
  "learning_rate": 4.848484848484849e-06,
64
- "loss": 1.5662,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 1.64,
69
  "learning_rate": 5.4545454545454545e-06,
70
- "loss": 1.4263,
71
  "step": 90
72
  },
73
  {
74
  "epoch": 1.82,
75
  "learning_rate": 6.060606060606061e-06,
76
- "loss": 1.2797,
77
  "step": 100
78
  },
79
  {
80
  "epoch": 2.0,
81
  "learning_rate": 6.666666666666667e-06,
82
- "loss": 1.1886,
83
  "step": 110
84
  },
85
  {
86
  "epoch": 2.0,
87
- "eval_accuracy": 0.6102272727272727,
88
- "eval_loss": 1.019785761833191,
89
- "eval_runtime": 11.0093,
90
- "eval_samples_per_second": 79.933,
91
- "eval_steps_per_second": 4.996,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.18,
96
  "learning_rate": 7.272727272727273e-06,
97
- "loss": 1.099,
98
  "step": 120
99
  },
100
  {
101
  "epoch": 2.36,
102
  "learning_rate": 7.87878787878788e-06,
103
- "loss": 1.0145,
104
  "step": 130
105
  },
106
  {
107
  "epoch": 2.55,
108
  "learning_rate": 8.484848484848486e-06,
109
- "loss": 0.9682,
110
  "step": 140
111
  },
112
  {
113
  "epoch": 2.73,
114
  "learning_rate": 9.090909090909091e-06,
115
- "loss": 0.9164,
116
  "step": 150
117
  },
118
  {
119
  "epoch": 2.91,
120
  "learning_rate": 9.696969696969698e-06,
121
- "loss": 0.8636,
122
  "step": 160
123
  },
124
  {
125
  "epoch": 3.0,
126
- "eval_accuracy": 0.7397727272727272,
127
- "eval_loss": 0.6859003305435181,
128
- "eval_runtime": 10.9928,
129
- "eval_samples_per_second": 80.052,
130
- "eval_steps_per_second": 5.003,
131
  "step": 165
132
  },
133
  {
134
  "epoch": 3.09,
135
  "learning_rate": 9.696969696969698e-06,
136
- "loss": 0.8709,
137
  "step": 170
138
  },
139
  {
140
  "epoch": 3.27,
141
  "learning_rate": 9.090909090909091e-06,
142
- "loss": 0.749,
143
  "step": 180
144
  },
145
  {
146
  "epoch": 3.45,
147
  "learning_rate": 8.484848484848486e-06,
148
- "loss": 0.7015,
149
  "step": 190
150
  },
151
  {
152
  "epoch": 3.64,
153
  "learning_rate": 7.87878787878788e-06,
154
- "loss": 0.6916,
155
  "step": 200
156
  },
157
  {
158
  "epoch": 3.82,
159
  "learning_rate": 7.272727272727273e-06,
160
- "loss": 0.6508,
161
  "step": 210
162
  },
163
  {
164
  "epoch": 4.0,
165
  "learning_rate": 6.666666666666667e-06,
166
- "loss": 0.576,
167
  "step": 220
168
  },
169
  {
170
  "epoch": 4.0,
171
- "eval_accuracy": 0.8477272727272728,
172
- "eval_loss": 0.4356772005558014,
173
- "eval_runtime": 10.9979,
174
- "eval_samples_per_second": 80.015,
175
- "eval_steps_per_second": 5.001,
176
  "step": 220
177
  },
178
  {
179
  "epoch": 4.18,
180
  "learning_rate": 6.060606060606061e-06,
181
- "loss": 0.51,
182
  "step": 230
183
  },
184
  {
185
  "epoch": 4.36,
186
  "learning_rate": 5.4545454545454545e-06,
187
- "loss": 0.5592,
188
  "step": 240
189
  },
190
  {
191
  "epoch": 4.55,
192
  "learning_rate": 4.848484848484849e-06,
193
- "loss": 0.5314,
194
  "step": 250
195
  },
196
  {
197
  "epoch": 4.73,
198
  "learning_rate": 4.242424242424243e-06,
199
- "loss": 0.5021,
200
  "step": 260
201
  },
202
  {
203
  "epoch": 4.91,
204
  "learning_rate": 3.6363636363636366e-06,
205
- "loss": 0.5875,
206
  "step": 270
207
  },
208
  {
209
  "epoch": 5.0,
210
- "eval_accuracy": 0.8386363636363636,
211
- "eval_loss": 0.418759286403656,
212
- "eval_runtime": 10.9077,
213
- "eval_samples_per_second": 80.677,
214
- "eval_steps_per_second": 5.042,
215
  "step": 275
216
  },
217
  {
218
  "epoch": 5.09,
219
  "learning_rate": 3.0303030303030305e-06,
220
- "loss": 0.4782,
221
  "step": 280
222
  },
223
  {
224
  "epoch": 5.27,
225
  "learning_rate": 2.4242424242424244e-06,
226
- "loss": 0.521,
227
  "step": 290
228
  },
229
  {
230
  "epoch": 5.45,
231
  "learning_rate": 1.8181818181818183e-06,
232
- "loss": 0.451,
233
  "step": 300
234
  },
235
  {
236
  "epoch": 5.64,
237
  "learning_rate": 1.2121212121212122e-06,
238
- "loss": 0.4403,
239
  "step": 310
240
  },
241
  {
242
  "epoch": 5.82,
243
  "learning_rate": 6.060606060606061e-07,
244
- "loss": 0.4929,
245
  "step": 320
246
  },
247
  {
248
  "epoch": 6.0,
249
  "learning_rate": 0.0,
250
- "loss": 0.4677,
251
  "step": 330
252
  },
253
  {
254
  "epoch": 6.0,
255
- "eval_accuracy": 0.8795454545454545,
256
- "eval_loss": 0.3292839825153351,
257
- "eval_runtime": 10.9849,
258
- "eval_samples_per_second": 80.11,
259
- "eval_steps_per_second": 5.007,
260
  "step": 330
261
  },
262
  {
263
  "epoch": 6.0,
264
  "step": 330,
265
  "total_flos": 4.860822854913491e+18,
266
- "train_loss": 1.0101308201298569,
267
- "train_runtime": 2441.1089,
268
- "train_samples_per_second": 8.647,
269
- "train_steps_per_second": 0.135
270
  }
271
  ],
272
  "max_steps": 330,
 
1
  {
2
+ "best_metric": 0.9659090909090909,
3
  "best_model_checkpoint": "swinv2-large-patch4-window12to16-192to256-22kto1k-ft-finetuned-eurosat-50/checkpoint-330",
4
  "epoch": 6.0,
5
  "global_step": 330,
 
10
  {
11
  "epoch": 0.18,
12
  "learning_rate": 6.060606060606061e-07,
13
+ "loss": 0.3989,
14
  "step": 10
15
  },
16
  {
17
  "epoch": 0.36,
18
  "learning_rate": 1.2121212121212122e-06,
19
+ "loss": 0.4458,
20
  "step": 20
21
  },
22
  {
23
  "epoch": 0.55,
24
  "learning_rate": 1.8181818181818183e-06,
25
+ "loss": 0.4395,
26
  "step": 30
27
  },
28
  {
29
  "epoch": 0.73,
30
  "learning_rate": 2.4242424242424244e-06,
31
+ "loss": 0.4139,
32
  "step": 40
33
  },
34
  {
35
  "epoch": 0.91,
36
  "learning_rate": 3.0303030303030305e-06,
37
+ "loss": 0.4562,
38
  "step": 50
39
  },
40
  {
41
  "epoch": 1.0,
42
+ "eval_accuracy": 0.8897727272727273,
43
+ "eval_loss": 0.3206745386123657,
44
+ "eval_runtime": 10.9207,
45
+ "eval_samples_per_second": 80.581,
46
+ "eval_steps_per_second": 5.036,
47
  "step": 55
48
  },
49
  {
50
  "epoch": 1.09,
51
  "learning_rate": 3.6363636363636366e-06,
52
+ "loss": 0.424,
53
  "step": 60
54
  },
55
  {
56
  "epoch": 1.27,
57
  "learning_rate": 4.242424242424243e-06,
58
+ "loss": 0.4218,
59
  "step": 70
60
  },
61
  {
62
  "epoch": 1.45,
63
  "learning_rate": 4.848484848484849e-06,
64
+ "loss": 0.3912,
65
  "step": 80
66
  },
67
  {
68
  "epoch": 1.64,
69
  "learning_rate": 5.4545454545454545e-06,
70
+ "loss": 0.3665,
71
  "step": 90
72
  },
73
  {
74
  "epoch": 1.82,
75
  "learning_rate": 6.060606060606061e-06,
76
+ "loss": 0.3969,
77
  "step": 100
78
  },
79
  {
80
  "epoch": 2.0,
81
  "learning_rate": 6.666666666666667e-06,
82
+ "loss": 0.372,
83
  "step": 110
84
  },
85
  {
86
  "epoch": 2.0,
87
+ "eval_accuracy": 0.9068181818181819,
88
+ "eval_loss": 0.2666811943054199,
89
+ "eval_runtime": 10.9113,
90
+ "eval_samples_per_second": 80.65,
91
+ "eval_steps_per_second": 5.041,
92
  "step": 110
93
  },
94
  {
95
  "epoch": 2.18,
96
  "learning_rate": 7.272727272727273e-06,
97
+ "loss": 0.35,
98
  "step": 120
99
  },
100
  {
101
  "epoch": 2.36,
102
  "learning_rate": 7.87878787878788e-06,
103
+ "loss": 0.275,
104
  "step": 130
105
  },
106
  {
107
  "epoch": 2.55,
108
  "learning_rate": 8.484848484848486e-06,
109
+ "loss": 0.2911,
110
  "step": 140
111
  },
112
  {
113
  "epoch": 2.73,
114
  "learning_rate": 9.090909090909091e-06,
115
+ "loss": 0.2794,
116
  "step": 150
117
  },
118
  {
119
  "epoch": 2.91,
120
  "learning_rate": 9.696969696969698e-06,
121
+ "loss": 0.2776,
122
  "step": 160
123
  },
124
  {
125
  "epoch": 3.0,
126
+ "eval_accuracy": 0.9125,
127
+ "eval_loss": 0.2862165570259094,
128
+ "eval_runtime": 11.069,
129
+ "eval_samples_per_second": 79.501,
130
+ "eval_steps_per_second": 4.969,
131
  "step": 165
132
  },
133
  {
134
  "epoch": 3.09,
135
  "learning_rate": 9.696969696969698e-06,
136
+ "loss": 0.3096,
137
  "step": 170
138
  },
139
  {
140
  "epoch": 3.27,
141
  "learning_rate": 9.090909090909091e-06,
142
+ "loss": 0.2071,
143
  "step": 180
144
  },
145
  {
146
  "epoch": 3.45,
147
  "learning_rate": 8.484848484848486e-06,
148
+ "loss": 0.2234,
149
  "step": 190
150
  },
151
  {
152
  "epoch": 3.64,
153
  "learning_rate": 7.87878787878788e-06,
154
+ "loss": 0.2446,
155
  "step": 200
156
  },
157
  {
158
  "epoch": 3.82,
159
  "learning_rate": 7.272727272727273e-06,
160
+ "loss": 0.1926,
161
  "step": 210
162
  },
163
  {
164
  "epoch": 4.0,
165
  "learning_rate": 6.666666666666667e-06,
166
+ "loss": 0.2018,
167
  "step": 220
168
  },
169
  {
170
  "epoch": 4.0,
171
+ "eval_accuracy": 0.9397727272727273,
172
+ "eval_loss": 0.19657106697559357,
173
+ "eval_runtime": 10.9849,
174
+ "eval_samples_per_second": 80.11,
175
+ "eval_steps_per_second": 5.007,
176
  "step": 220
177
  },
178
  {
179
  "epoch": 4.18,
180
  "learning_rate": 6.060606060606061e-06,
181
+ "loss": 0.1894,
182
  "step": 230
183
  },
184
  {
185
  "epoch": 4.36,
186
  "learning_rate": 5.4545454545454545e-06,
187
+ "loss": 0.2126,
188
  "step": 240
189
  },
190
  {
191
  "epoch": 4.55,
192
  "learning_rate": 4.848484848484849e-06,
193
+ "loss": 0.2101,
194
  "step": 250
195
  },
196
  {
197
  "epoch": 4.73,
198
  "learning_rate": 4.242424242424243e-06,
199
+ "loss": 0.2062,
200
  "step": 260
201
  },
202
  {
203
  "epoch": 4.91,
204
  "learning_rate": 3.6363636363636366e-06,
205
+ "loss": 0.2751,
206
  "step": 270
207
  },
208
  {
209
  "epoch": 5.0,
210
+ "eval_accuracy": 0.9375,
211
+ "eval_loss": 0.1937328726053238,
212
+ "eval_runtime": 10.9353,
213
+ "eval_samples_per_second": 80.474,
214
+ "eval_steps_per_second": 5.03,
215
  "step": 275
216
  },
217
  {
218
  "epoch": 5.09,
219
  "learning_rate": 3.0303030303030305e-06,
220
+ "loss": 0.219,
221
  "step": 280
222
  },
223
  {
224
  "epoch": 5.27,
225
  "learning_rate": 2.4242424242424244e-06,
226
+ "loss": 0.2875,
227
  "step": 290
228
  },
229
  {
230
  "epoch": 5.45,
231
  "learning_rate": 1.8181818181818183e-06,
232
+ "loss": 0.2401,
233
  "step": 300
234
  },
235
  {
236
  "epoch": 5.64,
237
  "learning_rate": 1.2121212121212122e-06,
238
+ "loss": 0.2208,
239
  "step": 310
240
  },
241
  {
242
  "epoch": 5.82,
243
  "learning_rate": 6.060606060606061e-07,
244
+ "loss": 0.2734,
245
  "step": 320
246
  },
247
  {
248
  "epoch": 6.0,
249
  "learning_rate": 0.0,
250
+ "loss": 0.2764,
251
  "step": 330
252
  },
253
  {
254
  "epoch": 6.0,
255
+ "eval_accuracy": 0.9659090909090909,
256
+ "eval_loss": 0.11989254504442215,
257
+ "eval_runtime": 11.0047,
258
+ "eval_samples_per_second": 79.966,
259
+ "eval_steps_per_second": 4.998,
260
  "step": 330
261
  },
262
  {
263
  "epoch": 6.0,
264
  "step": 330,
265
  "total_flos": 4.860822854913491e+18,
266
+ "train_loss": 0.3027138883417303,
267
+ "train_runtime": 956.6189,
268
+ "train_samples_per_second": 22.065,
269
+ "train_steps_per_second": 0.345
270
  }
271
  ],
272
  "max_steps": 330,