rlaaudrb1104 committed on
Commit
6dee97d
·
1 Parent(s): afa45ed

slicing and feature engineering

Browse files
Files changed (7) hide show
  1. config.json +5 -32
  2. model.safetensors +2 -2
  3. optimizer.pt +3 -0
  4. rng_state.pth +3 -0
  5. scheduler.pt +3 -0
  6. trainer_state.json +236 -0
  7. training_args.bin +2 -2
config.json CHANGED
@@ -1,53 +1,26 @@
1
  {
2
- "_name_or_path": "microsoft/graphcodebert-base",
3
  "architectures": [
4
- "RobertaForSequenceClassification"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "bos_token_id": 0,
8
  "classifier_dropout": null,
9
  "eos_token_id": 2,
10
- "gradient_checkpointing": false,
11
  "hidden_act": "gelu",
12
  "hidden_dropout_prob": 0.1,
13
  "hidden_size": 768,
14
- "id2label": {
15
- "0": "LABEL_0",
16
- "1": "LABEL_1",
17
- "2": "LABEL_2",
18
- "3": "LABEL_3",
19
- "4": "LABEL_4",
20
- "5": "LABEL_5",
21
- "6": "LABEL_6",
22
- "7": "LABEL_7",
23
- "8": "LABEL_8",
24
- "9": "LABEL_9"
25
- },
26
  "initializer_range": 0.02,
27
  "intermediate_size": 3072,
28
- "label2id": {
29
- "LABEL_0": 0,
30
- "LABEL_1": 1,
31
- "LABEL_2": 2,
32
- "LABEL_3": 3,
33
- "LABEL_4": 4,
34
- "LABEL_5": 5,
35
- "LABEL_6": 6,
36
- "LABEL_7": 7,
37
- "LABEL_8": 8,
38
- "LABEL_9": 9
39
- },
40
- "layer_norm_eps": 1e-05,
41
  "max_position_embeddings": 514,
42
- "model_type": "roberta",
43
  "num_attention_heads": 12,
44
  "num_hidden_layers": 12,
45
- "output_past": true,
46
  "pad_token_id": 1,
47
  "position_embedding_type": "absolute",
48
- "problem_type": "single_label_classification",
49
  "torch_dtype": "float32",
50
- "transformers_version": "4.40.1",
51
  "type_vocab_size": 1,
52
  "use_cache": true,
53
  "vocab_size": 50265
 
1
  {
 
2
  "architectures": [
3
+ "CodeBERTForVulnerabilityDetectionWithFeatures"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
  "bos_token_id": 0,
7
  "classifier_dropout": null,
8
  "eos_token_id": 2,
 
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
 
 
 
 
 
 
 
 
 
 
 
 
12
  "initializer_range": 0.02,
13
  "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
 
 
 
 
 
 
 
 
 
 
 
 
15
  "max_position_embeddings": 514,
16
+ "model_type": "codebert",
17
  "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
+ "output_attentions": true,
20
  "pad_token_id": 1,
21
  "position_embedding_type": "absolute",
 
22
  "torch_dtype": "float32",
23
+ "transformers_version": "4.41.1",
24
  "type_vocab_size": 1,
25
  "use_cache": true,
26
  "vocab_size": 50265
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e9fbc6c8e352b7fb9cdd20e15a359a3c1b1869da5086b212ed38025d1968db9
3
- size 498637432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9bcae3293b5d29ff9f520b875765460e825e12ec2ecccdf5fb2635ab3d058ec
3
+ size 498692860
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeda6c76b7102eb22693937d10b880ae3af91f76df0a3a54359358853fc95e33
3
+ size 997506746
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc880f662532368769bf627f8612e2c4b90986f8b4c7b89b3f45762dc6d424d
3
+ size 14244
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1b227ad2a10700168d2b014fe9a1d55c46d4ec5e2f18bd52971da8f64d4b44b
3
+ size 1064
trainer_state.json ADDED
@@ -0,0 +1,236 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 4.685408299866131,
5
+ "eval_steps": 500,
6
+ "global_step": 3500,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.6693440428380187,
13
+ "grad_norm": 14.38033676147461,
14
+ "learning_rate": 4.97e-05,
15
+ "loss": 1.6741,
16
+ "step": 500
17
+ },
18
+ {
19
+ "epoch": 0.6693440428380187,
20
+ "eval_accuracy": 0.6358458961474037,
21
+ "eval_f1_class_0": 0.9606299212598425,
22
+ "eval_f1_class_1": 0.4562647754137116,
23
+ "eval_f1_class_2": 0.5818673883626523,
24
+ "eval_f1_class_3": 0.6752,
25
+ "eval_f1_class_4": 0.4695259593679458,
26
+ "eval_f1_class_5": 0.6699186991869919,
27
+ "eval_f1_class_6": 0.6111908177905309,
28
+ "eval_f1_class_7": 0.6285714285714286,
29
+ "eval_f1_class_8": 0.7056603773584904,
30
+ "eval_f1_macro": 0.6398699297012882,
31
+ "eval_f1_micro": 0.6358458961474037,
32
+ "eval_f1_weighted": 0.6376816033602213,
33
+ "eval_loss": 1.0920162200927734,
34
+ "eval_recall_weighted": 0.6358458961474037,
35
+ "eval_runtime": 52.0874,
36
+ "eval_samples_per_second": 57.307,
37
+ "eval_steps_per_second": 1.805,
38
+ "step": 500
39
+ },
40
+ {
41
+ "epoch": 1.3386880856760375,
42
+ "grad_norm": 13.991486549377441,
43
+ "learning_rate": 4.643472022955524e-05,
44
+ "loss": 0.77,
45
+ "step": 1000
46
+ },
47
+ {
48
+ "epoch": 1.3386880856760375,
49
+ "eval_accuracy": 0.8395309882747068,
50
+ "eval_f1_class_0": 0.9654088050314467,
51
+ "eval_f1_class_1": 0.7083333333333334,
52
+ "eval_f1_class_2": 0.8022598870056498,
53
+ "eval_f1_class_3": 0.8431952662721893,
54
+ "eval_f1_class_4": 0.7962674961119751,
55
+ "eval_f1_class_5": 0.8715447154471545,
56
+ "eval_f1_class_6": 0.8243430152143845,
57
+ "eval_f1_class_7": 0.8963210702341138,
58
+ "eval_f1_class_8": 0.8755760368663594,
59
+ "eval_f1_macro": 0.8425832917240673,
60
+ "eval_f1_micro": 0.8395309882747068,
61
+ "eval_f1_weighted": 0.8406783887287406,
62
+ "eval_loss": 0.5749590992927551,
63
+ "eval_recall_weighted": 0.8395309882747068,
64
+ "eval_runtime": 52.1038,
65
+ "eval_samples_per_second": 57.289,
66
+ "eval_steps_per_second": 1.804,
67
+ "step": 1000
68
+ },
69
+ {
70
+ "epoch": 2.0080321285140563,
71
+ "grad_norm": 2.8914544582366943,
72
+ "learning_rate": 4.284791965566714e-05,
73
+ "loss": 0.4007,
74
+ "step": 1500
75
+ },
76
+ {
77
+ "epoch": 2.0080321285140563,
78
+ "eval_accuracy": 0.8931323283082077,
79
+ "eval_f1_class_0": 0.96875,
80
+ "eval_f1_class_1": 0.7915492957746477,
81
+ "eval_f1_class_2": 0.8837209302325582,
82
+ "eval_f1_class_3": 0.838235294117647,
83
+ "eval_f1_class_4": 0.844574780058651,
84
+ "eval_f1_class_5": 0.9504,
85
+ "eval_f1_class_6": 0.9249617151607963,
86
+ "eval_f1_class_7": 0.9345794392523364,
87
+ "eval_f1_class_8": 0.9199999999999999,
88
+ "eval_f1_macro": 0.895196828288515,
89
+ "eval_f1_micro": 0.8931323283082077,
90
+ "eval_f1_weighted": 0.8935187314222036,
91
+ "eval_loss": 0.3943232595920563,
92
+ "eval_recall_weighted": 0.8931323283082077,
93
+ "eval_runtime": 52.1055,
94
+ "eval_samples_per_second": 57.288,
95
+ "eval_steps_per_second": 1.804,
96
+ "step": 1500
97
+ },
98
+ {
99
+ "epoch": 2.677376171352075,
100
+ "grad_norm": 2.264118194580078,
101
+ "learning_rate": 3.926111908177906e-05,
102
+ "loss": 0.2025,
103
+ "step": 2000
104
+ },
105
+ {
106
+ "epoch": 2.677376171352075,
107
+ "eval_accuracy": 0.9165829145728643,
108
+ "eval_f1_class_0": 0.9734789391575663,
109
+ "eval_f1_class_1": 0.8170563961485556,
110
+ "eval_f1_class_2": 0.9121338912133892,
111
+ "eval_f1_class_3": 0.910384068278805,
112
+ "eval_f1_class_4": 0.8715447154471545,
113
+ "eval_f1_class_5": 0.9562499999999999,
114
+ "eval_f1_class_6": 0.9147058823529411,
115
+ "eval_f1_class_7": 0.9559748427672956,
116
+ "eval_f1_class_8": 0.9525368248772503,
117
+ "eval_f1_macro": 0.918229506693662,
118
+ "eval_f1_micro": 0.9165829145728643,
119
+ "eval_f1_weighted": 0.9169458307013622,
120
+ "eval_loss": 0.392281711101532,
121
+ "eval_recall_weighted": 0.9165829145728643,
122
+ "eval_runtime": 52.1029,
123
+ "eval_samples_per_second": 57.29,
124
+ "eval_steps_per_second": 1.804,
125
+ "step": 2000
126
+ },
127
+ {
128
+ "epoch": 3.3467202141900936,
129
+ "grad_norm": 9.838397979736328,
130
+ "learning_rate": 3.5674318507890965e-05,
131
+ "loss": 0.1351,
132
+ "step": 2500
133
+ },
134
+ {
135
+ "epoch": 3.3467202141900936,
136
+ "eval_accuracy": 0.9252931323283082,
137
+ "eval_f1_class_0": 0.9750778816199377,
138
+ "eval_f1_class_1": 0.8636363636363636,
139
+ "eval_f1_class_2": 0.909814323607427,
140
+ "eval_f1_class_3": 0.8973607038123167,
141
+ "eval_f1_class_4": 0.8852459016393442,
142
+ "eval_f1_class_5": 0.9549839228295819,
143
+ "eval_f1_class_6": 0.9319526627218935,
144
+ "eval_f1_class_7": 0.9635499207606973,
145
+ "eval_f1_class_8": 0.9556962025316457,
146
+ "eval_f1_macro": 0.9263686536843565,
147
+ "eval_f1_micro": 0.9252931323283082,
148
+ "eval_f1_weighted": 0.9251223151765453,
149
+ "eval_loss": 0.38727396726608276,
150
+ "eval_recall_weighted": 0.9252931323283082,
151
+ "eval_runtime": 52.0796,
152
+ "eval_samples_per_second": 57.316,
153
+ "eval_steps_per_second": 1.805,
154
+ "step": 2500
155
+ },
156
+ {
157
+ "epoch": 4.016064257028113,
158
+ "grad_norm": 3.1932365894317627,
159
+ "learning_rate": 3.208751793400287e-05,
160
+ "loss": 0.1193,
161
+ "step": 3000
162
+ },
163
+ {
164
+ "epoch": 4.016064257028113,
165
+ "eval_accuracy": 0.9366834170854271,
166
+ "eval_f1_class_0": 0.9753086419753085,
167
+ "eval_f1_class_1": 0.8781954887218045,
168
+ "eval_f1_class_2": 0.9465020576131686,
169
+ "eval_f1_class_3": 0.8873626373626373,
170
+ "eval_f1_class_4": 0.9245283018867925,
171
+ "eval_f1_class_5": 0.9478672985781991,
172
+ "eval_f1_class_6": 0.948301329394387,
173
+ "eval_f1_class_7": 0.9695999999999999,
174
+ "eval_f1_class_8": 0.9602543720190778,
175
+ "eval_f1_macro": 0.9375466808390418,
176
+ "eval_f1_micro": 0.9366834170854271,
177
+ "eval_f1_weighted": 0.9367077203287543,
178
+ "eval_loss": 0.36861082911491394,
179
+ "eval_recall_weighted": 0.9366834170854271,
180
+ "eval_runtime": 52.0777,
181
+ "eval_samples_per_second": 57.318,
182
+ "eval_steps_per_second": 1.805,
183
+ "step": 3000
184
+ },
185
+ {
186
+ "epoch": 4.685408299866131,
187
+ "grad_norm": 16.49643325805664,
188
+ "learning_rate": 2.850071736011478e-05,
189
+ "loss": 0.063,
190
+ "step": 3500
191
+ },
192
+ {
193
+ "epoch": 4.685408299866131,
194
+ "eval_accuracy": 0.9396984924623115,
195
+ "eval_f1_class_0": 0.9751552795031054,
196
+ "eval_f1_class_1": 0.8555240793201134,
197
+ "eval_f1_class_2": 0.9222222222222223,
198
+ "eval_f1_class_3": 0.9184549356223176,
199
+ "eval_f1_class_4": 0.9200603318250377,
200
+ "eval_f1_class_5": 0.9730586370839936,
201
+ "eval_f1_class_6": 0.9650986342943855,
202
+ "eval_f1_class_7": 0.964968152866242,
203
+ "eval_f1_class_8": 0.9774193548387097,
204
+ "eval_f1_macro": 0.9413290697306808,
205
+ "eval_f1_micro": 0.9396984924623115,
206
+ "eval_f1_weighted": 0.9399337568761867,
207
+ "eval_loss": 0.3695576786994934,
208
+ "eval_recall_weighted": 0.9396984924623115,
209
+ "eval_runtime": 52.0778,
210
+ "eval_samples_per_second": 57.318,
211
+ "eval_steps_per_second": 1.805,
212
+ "step": 3500
213
+ }
214
+ ],
215
+ "logging_steps": 500,
216
+ "max_steps": 7470,
217
+ "num_input_tokens_seen": 0,
218
+ "num_train_epochs": 10,
219
+ "save_steps": 500,
220
+ "stateful_callbacks": {
221
+ "TrainerControl": {
222
+ "args": {
223
+ "should_epoch_stop": false,
224
+ "should_evaluate": false,
225
+ "should_log": false,
226
+ "should_save": true,
227
+ "should_training_stop": false
228
+ },
229
+ "attributes": {}
230
+ }
231
+ },
232
+ "total_flos": 1.47218650942464e+16,
233
+ "train_batch_size": 16,
234
+ "trial_name": null,
235
+ "trial_params": null
236
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ae381d8a4e60b845958278ae33592715df0c591a7af3c62d64bd55e46c5dd18
3
- size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41dd377079db2bb5319531916f5985e2f6d42d7d70265ab3bb800398e5955fc2
3
+ size 5048