tenFnAN committed on
Commit
47117d7
·
verified ·
1 Parent(s): fa02a71

Model save

Browse files
README.md CHANGED
@@ -18,8 +18,8 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.5612
22
- - Accuracy: 0.7935
23
 
24
  ## Model description
25
 
@@ -52,10 +52,10 @@ The following hyperparameters were used during training:
52
 
53
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
54
  |:-------------:|:------:|:----:|:---------------:|:--------:|
55
- | 2.1719 | 0.2568 | 38 | 2.0526 | 0.1714 |
56
- | 1.4069 | 1.2568 | 76 | 1.2280 | 0.4714 |
57
- | 0.6534 | 2.2568 | 114 | 0.7264 | 0.7 |
58
- | 0.3677 | 3.2297 | 148 | 0.5529 | 0.8 |
59
 
60
 
61
  ### Framework versions
 
18
 
19
  This model is a fine-tuned version of [MCG-NJU/videomae-base](https://huggingface.co/MCG-NJU/videomae-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 0.3988
22
+ - Accuracy: 0.8714
23
 
24
  ## Model description
25
 
 
52
 
53
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
54
  |:-------------:|:------:|:----:|:---------------:|:--------:|
55
+ | 2.1392 | 0.2568 | 38 | 1.8769 | 0.4143 |
56
+ | 1.0079 | 1.2568 | 76 | 0.9862 | 0.7286 |
57
+ | 0.4814 | 2.2568 | 114 | 0.5106 | 0.8857 |
58
+ | 0.3286 | 3.2297 | 148 | 0.3988 | 0.8714 |
59
 
60
 
61
  ### Framework versions
all_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.22972972972973,
3
- "eval_accuracy": 0.7935483870967742,
4
- "eval_loss": 0.5611749291419983,
5
- "eval_runtime": 7.9378,
6
- "eval_samples_per_second": 19.527,
7
- "eval_steps_per_second": 2.52
8
  }
 
1
  {
2
  "epoch": 3.22972972972973,
3
+ "eval_accuracy": 0.8064516129032258,
4
+ "eval_loss": 0.5119282603263855,
5
+ "eval_runtime": 8.1588,
6
+ "eval_samples_per_second": 18.998,
7
+ "eval_steps_per_second": 2.451
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37a1911d5bea29d14fd90e9de8f41ae225fd93992cce7669f3dfcabdb0d9f7c2
3
  size 344961984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e9782a92fe2b92d055c33d710abfcc464ea7d62fbe46fdb190fd0425137b6ec
3
  size 344961984
runs/Dec09_21-13-29_psroka/events.out.tfevents.1733776568.psroka.814400.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76522f4b5ba1d595c1a2886a016d42b55605e664ef5c9005a887f2eb26f131fe
3
- size 8974
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bd07efd3e0816d797b9333d4833b4946f392cdcaebe2e5440cfa6f851c7646a
3
+ size 10280
runs/Dec09_21-13-29_psroka/events.out.tfevents.1733776831.psroka.814400.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e92dc18f22572168499bd1ee5ef4188ba27b95050f95fb3880bfd9d2eba77d7
3
+ size 411
runs/Dec09_21-53-53_psroka/events.out.tfevents.1733777647.psroka.827004.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8b9549d01cb49190bff93e568409bc7bdd1485d0503193ffa9f7000927a3f78
3
+ size 10280
test_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 3.22972972972973,
3
- "eval_accuracy": 0.7935483870967742,
4
- "eval_loss": 0.5611749291419983,
5
- "eval_runtime": 7.9378,
6
- "eval_samples_per_second": 19.527,
7
- "eval_steps_per_second": 2.52
8
  }
 
1
  {
2
  "epoch": 3.22972972972973,
3
+ "eval_accuracy": 0.8064516129032258,
4
+ "eval_loss": 0.5119282603263855,
5
+ "eval_runtime": 8.1588,
6
+ "eval_samples_per_second": 18.998,
7
+ "eval_steps_per_second": 2.451
8
  }
trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.8,
3
  "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset\\checkpoint-148",
4
  "epoch": 3.22972972972973,
5
  "eval_steps": 500,
@@ -10,172 +10,154 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.06756756756756757,
13
- "grad_norm": 16.5500545501709,
14
- "learning_rate": 2.6666666666666667e-05,
15
- "loss": 2.3071,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.13513513513513514,
20
- "grad_norm": 7.210005760192871,
21
  "learning_rate": 4.9248120300751884e-05,
22
- "loss": 2.2612,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.20270270270270271,
27
- "grad_norm": 7.997417449951172,
28
  "learning_rate": 4.548872180451128e-05,
29
- "loss": 2.1719,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.25675675675675674,
34
- "eval_accuracy": 0.17142857142857143,
35
- "eval_loss": 2.0525670051574707,
36
- "eval_runtime": 3.6401,
37
- "eval_samples_per_second": 19.23,
38
- "eval_steps_per_second": 2.472,
39
  "step": 38
40
  },
41
  {
42
  "epoch": 1.0135135135135136,
43
- "grad_norm": 7.0121283531188965,
44
  "learning_rate": 4.172932330827068e-05,
45
- "loss": 1.9451,
46
  "step": 40
47
  },
48
  {
49
  "epoch": 1.0810810810810811,
50
- "grad_norm": 11.407858848571777,
51
  "learning_rate": 3.796992481203008e-05,
52
- "loss": 1.7221,
53
  "step": 50
54
  },
55
  {
56
  "epoch": 1.1486486486486487,
57
- "grad_norm": 14.631987571716309,
58
  "learning_rate": 3.421052631578947e-05,
59
- "loss": 1.4956,
60
  "step": 60
61
  },
62
  {
63
  "epoch": 1.2162162162162162,
64
- "grad_norm": 9.013343811035156,
65
  "learning_rate": 3.0451127819548874e-05,
66
- "loss": 1.4069,
67
  "step": 70
68
  },
69
  {
70
  "epoch": 1.2567567567567568,
71
- "eval_accuracy": 0.4714285714285714,
72
- "eval_loss": 1.2280380725860596,
73
- "eval_runtime": 3.6911,
74
- "eval_samples_per_second": 18.964,
75
- "eval_steps_per_second": 2.438,
76
  "step": 76
77
  },
78
  {
79
  "epoch": 2.027027027027027,
80
- "grad_norm": 9.636581420898438,
81
  "learning_rate": 2.6691729323308275e-05,
82
- "loss": 0.995,
83
  "step": 80
84
  },
85
  {
86
  "epoch": 2.0945945945945947,
87
- "grad_norm": 9.935404777526855,
88
  "learning_rate": 2.293233082706767e-05,
89
- "loss": 0.8051,
90
  "step": 90
91
  },
92
  {
93
  "epoch": 2.1621621621621623,
94
- "grad_norm": 9.97338581085205,
95
  "learning_rate": 1.9172932330827066e-05,
96
- "loss": 0.8465,
97
  "step": 100
98
  },
99
  {
100
  "epoch": 2.22972972972973,
101
- "grad_norm": 8.2127103805542,
102
  "learning_rate": 1.5413533834586467e-05,
103
- "loss": 0.6534,
104
  "step": 110
105
  },
106
  {
107
  "epoch": 2.2567567567567566,
108
- "eval_accuracy": 0.7,
109
- "eval_loss": 0.7263602018356323,
110
- "eval_runtime": 3.6476,
111
- "eval_samples_per_second": 19.191,
112
- "eval_steps_per_second": 2.467,
113
  "step": 114
114
  },
115
  {
116
  "epoch": 3.0405405405405403,
117
- "grad_norm": 8.435063362121582,
118
  "learning_rate": 1.1654135338345864e-05,
119
- "loss": 0.5543,
120
  "step": 120
121
  },
122
  {
123
  "epoch": 3.108108108108108,
124
- "grad_norm": 3.56019926071167,
125
  "learning_rate": 7.894736842105263e-06,
126
- "loss": 0.4172,
127
  "step": 130
128
  },
129
  {
130
  "epoch": 3.175675675675676,
131
- "grad_norm": 7.430360317230225,
132
  "learning_rate": 4.135338345864662e-06,
133
- "loss": 0.3677,
134
  "step": 140
135
  },
136
  {
137
  "epoch": 3.22972972972973,
138
- "eval_accuracy": 0.8,
139
- "eval_loss": 0.552931547164917,
140
- "eval_runtime": 3.5081,
141
- "eval_samples_per_second": 19.954,
142
- "eval_steps_per_second": 2.565,
143
  "step": 148
144
  },
145
  {
146
  "epoch": 3.22972972972973,
147
  "step": 148,
148
  "total_flos": 1.460491890402263e+18,
149
- "train_loss": 1.2348162676836993,
150
- "train_runtime": 139.5019,
151
- "train_samples_per_second": 8.487,
152
- "train_steps_per_second": 1.061
153
  },
154
  {
155
  "epoch": 3.22972972972973,
156
- "eval_accuracy": 0.7935483870967742,
157
- "eval_loss": 0.561172604560852,
158
- "eval_runtime": 7.6883,
159
- "eval_samples_per_second": 20.161,
160
- "eval_steps_per_second": 2.601,
161
- "step": 148
162
- },
163
- {
164
- "epoch": 3.22972972972973,
165
- "eval_accuracy": 0.7935483870967742,
166
- "eval_loss": 0.5611749291419983,
167
- "eval_runtime": 7.9378,
168
- "eval_samples_per_second": 19.527,
169
- "eval_steps_per_second": 2.52,
170
- "step": 148
171
- },
172
- {
173
- "epoch": 3.22972972972973,
174
- "eval_accuracy": 0.7935483870967742,
175
- "eval_loss": 0.5611773133277893,
176
- "eval_runtime": 7.4937,
177
- "eval_samples_per_second": 20.684,
178
- "eval_steps_per_second": 2.669,
179
  "step": 148
180
  }
181
  ],
 
1
  {
2
+ "best_metric": 0.8714285714285714,
3
  "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset\\checkpoint-148",
4
  "epoch": 3.22972972972973,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.06756756756756757,
13
+ "grad_norm": 11.614557266235352,
14
+ "learning_rate": 2.3333333333333336e-05,
15
+ "loss": 2.3407,
16
  "step": 10
17
  },
18
  {
19
  "epoch": 0.13513513513513514,
20
+ "grad_norm": 7.542444229125977,
21
  "learning_rate": 4.9248120300751884e-05,
22
+ "loss": 2.2367,
23
  "step": 20
24
  },
25
  {
26
  "epoch": 0.20270270270270271,
27
+ "grad_norm": 8.507399559020996,
28
  "learning_rate": 4.548872180451128e-05,
29
+ "loss": 2.201,
30
  "step": 30
31
  },
32
  {
33
  "epoch": 0.25675675675675674,
34
+ "eval_accuracy": 0.5428571428571428,
35
+ "eval_loss": 1.803983211517334,
36
+ "eval_runtime": 3.6229,
37
+ "eval_samples_per_second": 19.322,
38
+ "eval_steps_per_second": 2.484,
39
  "step": 38
40
  },
41
  {
42
  "epoch": 1.0135135135135136,
43
+ "grad_norm": 9.280707359313965,
44
  "learning_rate": 4.172932330827068e-05,
45
+ "loss": 2.0,
46
  "step": 40
47
  },
48
  {
49
  "epoch": 1.0810810810810811,
50
+ "grad_norm": 10.3395357131958,
51
  "learning_rate": 3.796992481203008e-05,
52
+ "loss": 1.6049,
53
  "step": 50
54
  },
55
  {
56
  "epoch": 1.1486486486486487,
57
+ "grad_norm": 9.636208534240723,
58
  "learning_rate": 3.421052631578947e-05,
59
+ "loss": 1.2228,
60
  "step": 60
61
  },
62
  {
63
  "epoch": 1.2162162162162162,
64
+ "grad_norm": 7.421963691711426,
65
  "learning_rate": 3.0451127819548874e-05,
66
+ "loss": 0.9633,
67
  "step": 70
68
  },
69
  {
70
  "epoch": 1.2567567567567568,
71
+ "eval_accuracy": 0.6285714285714286,
72
+ "eval_loss": 0.8886963129043579,
73
+ "eval_runtime": 3.7412,
74
+ "eval_samples_per_second": 18.711,
75
+ "eval_steps_per_second": 2.406,
76
  "step": 76
77
  },
78
  {
79
  "epoch": 2.027027027027027,
80
+ "grad_norm": 10.210707664489746,
81
  "learning_rate": 2.6691729323308275e-05,
82
+ "loss": 0.794,
83
  "step": 80
84
  },
85
  {
86
  "epoch": 2.0945945945945947,
87
+ "grad_norm": 11.060843467712402,
88
  "learning_rate": 2.293233082706767e-05,
89
+ "loss": 0.6296,
90
  "step": 90
91
  },
92
  {
93
  "epoch": 2.1621621621621623,
94
+ "grad_norm": 10.571476936340332,
95
  "learning_rate": 1.9172932330827066e-05,
96
+ "loss": 0.5047,
97
  "step": 100
98
  },
99
  {
100
  "epoch": 2.22972972972973,
101
+ "grad_norm": 5.044342041015625,
102
  "learning_rate": 1.5413533834586467e-05,
103
+ "loss": 0.4839,
104
  "step": 110
105
  },
106
  {
107
  "epoch": 2.2567567567567566,
108
+ "eval_accuracy": 0.7714285714285715,
109
+ "eval_loss": 0.599827229976654,
110
+ "eval_runtime": 3.9209,
111
+ "eval_samples_per_second": 17.853,
112
+ "eval_steps_per_second": 2.295,
113
  "step": 114
114
  },
115
  {
116
  "epoch": 3.0405405405405403,
117
+ "grad_norm": 8.765264511108398,
118
  "learning_rate": 1.1654135338345864e-05,
119
+ "loss": 0.3181,
120
  "step": 120
121
  },
122
  {
123
  "epoch": 3.108108108108108,
124
+ "grad_norm": 3.8785786628723145,
125
  "learning_rate": 7.894736842105263e-06,
126
+ "loss": 0.2858,
127
  "step": 130
128
  },
129
  {
130
  "epoch": 3.175675675675676,
131
+ "grad_norm": 2.8601646423339844,
132
  "learning_rate": 4.135338345864662e-06,
133
+ "loss": 0.2545,
134
  "step": 140
135
  },
136
  {
137
  "epoch": 3.22972972972973,
138
+ "eval_accuracy": 0.8714285714285714,
139
+ "eval_loss": 0.40526869893074036,
140
+ "eval_runtime": 3.6308,
141
+ "eval_samples_per_second": 19.28,
142
+ "eval_steps_per_second": 2.479,
143
  "step": 148
144
  },
145
  {
146
  "epoch": 3.22972972972973,
147
  "step": 148,
148
  "total_flos": 1.460491890402263e+18,
149
+ "train_loss": 1.0872333371961438,
150
+ "train_runtime": 198.8948,
151
+ "train_samples_per_second": 5.953,
152
+ "train_steps_per_second": 0.744
153
  },
154
  {
155
  "epoch": 3.22972972972973,
156
+ "eval_accuracy": 0.8064516129032258,
157
+ "eval_loss": 0.5119282603263855,
158
+ "eval_runtime": 8.1588,
159
+ "eval_samples_per_second": 18.998,
160
+ "eval_steps_per_second": 2.451,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
161
  "step": 148
162
  }
163
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ea7cab49c4e93ed45d49ec0933d4da4a7a51594614614d7d065fefc9650ee781
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:acc02801356b15f5ed557a809a6daa80fc3b7ab0f45609a901a8689ac4560959
3
  size 5304