kpeng-05 committed on
Commit
58bc184
·
verified ·
1 Parent(s): b2bcf49

Upload 9 files

Browse files
config.json ADDED
@@ -0,0 +1,79 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "microsoft/beit-base-patch16-224",
3
+ "add_fpn": false,
4
+ "architectures": [
5
+ "BeitForImageClassification"
6
+ ],
7
+ "attention_probs_dropout_prob": 0.0,
8
+ "auxiliary_channels": 256,
9
+ "auxiliary_concat_input": false,
10
+ "auxiliary_loss_weight": 0.4,
11
+ "auxiliary_num_convs": 1,
12
+ "drop_path_rate": 0.1,
13
+ "hidden_act": "gelu",
14
+ "hidden_dropout_prob": 0.0,
15
+ "hidden_size": 768,
16
+ "id2label": {
17
+ "0": "faceswap",
18
+ "1": "real",
19
+ "2": "sfhq",
20
+ "3": "stable_diffusion",
21
+ "4": "thispersondoesnotexist"
22
+ },
23
+ "image_size": 224,
24
+ "initializer_range": 0.02,
25
+ "intermediate_size": 3072,
26
+ "label2id": {
27
+ "faceswap": 0,
28
+ "real": 1,
29
+ "sfhq": 2,
30
+ "stable_diffusion": 3,
31
+ "thispersondoesnotexist": 4
32
+ },
33
+ "layer_norm_eps": 1e-12,
34
+ "layer_scale_init_value": 0.1,
35
+ "model_type": "beit",
36
+ "num_attention_heads": 12,
37
+ "num_channels": 3,
38
+ "num_hidden_layers": 12,
39
+ "out_features": [
40
+ "stage12"
41
+ ],
42
+ "out_indices": [
43
+ 12
44
+ ],
45
+ "patch_size": 16,
46
+ "pool_scales": [
47
+ 1,
48
+ 2,
49
+ 3,
50
+ 6
51
+ ],
52
+ "problem_type": "single_label_classification",
53
+ "reshape_hidden_states": true,
54
+ "semantic_loss_ignore_index": 255,
55
+ "stage_names": [
56
+ "stem",
57
+ "stage1",
58
+ "stage2",
59
+ "stage3",
60
+ "stage4",
61
+ "stage5",
62
+ "stage6",
63
+ "stage7",
64
+ "stage8",
65
+ "stage9",
66
+ "stage10",
67
+ "stage11",
68
+ "stage12"
69
+ ],
70
+ "torch_dtype": "float32",
71
+ "transformers_version": "4.48.2",
72
+ "use_absolute_position_embeddings": false,
73
+ "use_auxiliary_head": true,
74
+ "use_mask_token": false,
75
+ "use_mean_pooling": true,
76
+ "use_relative_position_bias": true,
77
+ "use_shared_relative_position_bias": false,
78
+ "vocab_size": 8192
79
+ }
gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:091dfb9ee437c743f08996c35e9a85b50dea43c4f2c08d1749f43b6a722e0f74
3
+ size 343089556
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76f32410aad2b8fde67664100ba77b9206b7829ac98f873c32fd25ed980430bc
3
+ size 686313082
preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": false,
7
+ "do_normalize": true,
8
+ "do_reduce_labels": false,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.5,
13
+ 0.5,
14
+ 0.5
15
+ ],
16
+ "image_processor_type": "BeitFeatureExtractor",
17
+ "image_std": [
18
+ 0.5,
19
+ 0.5,
20
+ 0.5
21
+ ],
22
+ "resample": 2,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "height": 224,
26
+ "width": 224
27
+ }
28
+ }
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30802ee6b802cf0755cac9a204b064ca9c552516d1e85cb6072aafc4ac576b5a
3
+ size 14244
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14508328767fb35b822b09b625b1477a4ecbcb3c4dd224dd08a15bd502df0d95
3
+ size 1064
trainer_state.json ADDED
@@ -0,0 +1,242 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9493333333333334,
3
+ "best_model_checkpoint": "./beit_finetuned\\checkpoint-1314",
4
+ "epoch": 3.0,
5
+ "eval_steps": 500,
6
+ "global_step": 1314,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.1141552511415525,
13
+ "grad_norm": 8.857061386108398,
14
+ "learning_rate": 4.8173515981735164e-05,
15
+ "loss": 1.0756,
16
+ "step": 50
17
+ },
18
+ {
19
+ "epoch": 0.228310502283105,
20
+ "grad_norm": 6.956742286682129,
21
+ "learning_rate": 4.6270928462709285e-05,
22
+ "loss": 0.8313,
23
+ "step": 100
24
+ },
25
+ {
26
+ "epoch": 0.3424657534246575,
27
+ "grad_norm": 25.718080520629883,
28
+ "learning_rate": 4.452054794520548e-05,
29
+ "loss": 0.7164,
30
+ "step": 150
31
+ },
32
+ {
33
+ "epoch": 0.45662100456621,
34
+ "grad_norm": 14.741324424743652,
35
+ "learning_rate": 4.26179604261796e-05,
36
+ "loss": 0.6739,
37
+ "step": 200
38
+ },
39
+ {
40
+ "epoch": 0.5707762557077626,
41
+ "grad_norm": 8.193249702453613,
42
+ "learning_rate": 4.071537290715373e-05,
43
+ "loss": 0.6212,
44
+ "step": 250
45
+ },
46
+ {
47
+ "epoch": 0.684931506849315,
48
+ "grad_norm": 18.06510353088379,
49
+ "learning_rate": 3.881278538812785e-05,
50
+ "loss": 0.4952,
51
+ "step": 300
52
+ },
53
+ {
54
+ "epoch": 0.7990867579908676,
55
+ "grad_norm": 8.87159252166748,
56
+ "learning_rate": 3.691019786910198e-05,
57
+ "loss": 0.4409,
58
+ "step": 350
59
+ },
60
+ {
61
+ "epoch": 0.91324200913242,
62
+ "grad_norm": 2.9289777278900146,
63
+ "learning_rate": 3.50076103500761e-05,
64
+ "loss": 0.4377,
65
+ "step": 400
66
+ },
67
+ {
68
+ "epoch": 1.0,
69
+ "eval_accuracy": 0.8773333333333333,
70
+ "eval_loss": 0.36529314517974854,
71
+ "eval_runtime": 83.9644,
72
+ "eval_samples_per_second": 17.865,
73
+ "eval_steps_per_second": 1.12,
74
+ "step": 438
75
+ },
76
+ {
77
+ "epoch": 1.0273972602739727,
78
+ "grad_norm": 1.1098586320877075,
79
+ "learning_rate": 3.310502283105023e-05,
80
+ "loss": 0.2894,
81
+ "step": 450
82
+ },
83
+ {
84
+ "epoch": 1.1415525114155252,
85
+ "grad_norm": 17.91949462890625,
86
+ "learning_rate": 3.120243531202435e-05,
87
+ "loss": 0.2204,
88
+ "step": 500
89
+ },
90
+ {
91
+ "epoch": 1.2557077625570776,
92
+ "grad_norm": 3.071772575378418,
93
+ "learning_rate": 2.929984779299848e-05,
94
+ "loss": 0.1716,
95
+ "step": 550
96
+ },
97
+ {
98
+ "epoch": 1.36986301369863,
99
+ "grad_norm": 1.6142654418945312,
100
+ "learning_rate": 2.7397260273972603e-05,
101
+ "loss": 0.1754,
102
+ "step": 600
103
+ },
104
+ {
105
+ "epoch": 1.4840182648401825,
106
+ "grad_norm": 25.471872329711914,
107
+ "learning_rate": 2.549467275494673e-05,
108
+ "loss": 0.2025,
109
+ "step": 650
110
+ },
111
+ {
112
+ "epoch": 1.5981735159817352,
113
+ "grad_norm": 3.1595094203948975,
114
+ "learning_rate": 2.359208523592085e-05,
115
+ "loss": 0.2487,
116
+ "step": 700
117
+ },
118
+ {
119
+ "epoch": 1.7123287671232876,
120
+ "grad_norm": 3.188368797302246,
121
+ "learning_rate": 2.1689497716894976e-05,
122
+ "loss": 0.1964,
123
+ "step": 750
124
+ },
125
+ {
126
+ "epoch": 1.82648401826484,
127
+ "grad_norm": 0.5533382296562195,
128
+ "learning_rate": 1.97869101978691e-05,
129
+ "loss": 0.109,
130
+ "step": 800
131
+ },
132
+ {
133
+ "epoch": 1.9406392694063928,
134
+ "grad_norm": 15.678669929504395,
135
+ "learning_rate": 1.7884322678843227e-05,
136
+ "loss": 0.1221,
137
+ "step": 850
138
+ },
139
+ {
140
+ "epoch": 2.0,
141
+ "eval_accuracy": 0.8986666666666666,
142
+ "eval_loss": 0.3740909695625305,
143
+ "eval_runtime": 85.0571,
144
+ "eval_samples_per_second": 17.635,
145
+ "eval_steps_per_second": 1.105,
146
+ "step": 876
147
+ },
148
+ {
149
+ "epoch": 2.0547945205479454,
150
+ "grad_norm": 5.463280200958252,
151
+ "learning_rate": 1.5981735159817352e-05,
152
+ "loss": 0.1046,
153
+ "step": 900
154
+ },
155
+ {
156
+ "epoch": 2.1689497716894977,
157
+ "grad_norm": 14.793232917785645,
158
+ "learning_rate": 1.4079147640791476e-05,
159
+ "loss": 0.0534,
160
+ "step": 950
161
+ },
162
+ {
163
+ "epoch": 2.2831050228310503,
164
+ "grad_norm": 5.250246524810791,
165
+ "learning_rate": 1.2176560121765601e-05,
166
+ "loss": 0.02,
167
+ "step": 1000
168
+ },
169
+ {
170
+ "epoch": 2.3972602739726026,
171
+ "grad_norm": 22.0667667388916,
172
+ "learning_rate": 1.0273972602739726e-05,
173
+ "loss": 0.0274,
174
+ "step": 1050
175
+ },
176
+ {
177
+ "epoch": 2.5114155251141552,
178
+ "grad_norm": 4.051002025604248,
179
+ "learning_rate": 8.37138508371385e-06,
180
+ "loss": 0.0312,
181
+ "step": 1100
182
+ },
183
+ {
184
+ "epoch": 2.625570776255708,
185
+ "grad_norm": 1.257653832435608,
186
+ "learning_rate": 6.468797564687975e-06,
187
+ "loss": 0.0213,
188
+ "step": 1150
189
+ },
190
+ {
191
+ "epoch": 2.73972602739726,
192
+ "grad_norm": 3.783207654953003,
193
+ "learning_rate": 4.566210045662101e-06,
194
+ "loss": 0.0392,
195
+ "step": 1200
196
+ },
197
+ {
198
+ "epoch": 2.853881278538813,
199
+ "grad_norm": 0.03894606605172157,
200
+ "learning_rate": 2.663622526636225e-06,
201
+ "loss": 0.0378,
202
+ "step": 1250
203
+ },
204
+ {
205
+ "epoch": 2.968036529680365,
206
+ "grad_norm": 10.792261123657227,
207
+ "learning_rate": 7.610350076103501e-07,
208
+ "loss": 0.0187,
209
+ "step": 1300
210
+ },
211
+ {
212
+ "epoch": 3.0,
213
+ "eval_accuracy": 0.9493333333333334,
214
+ "eval_loss": 0.18020151555538177,
215
+ "eval_runtime": 85.2028,
216
+ "eval_samples_per_second": 17.605,
217
+ "eval_steps_per_second": 1.103,
218
+ "step": 1314
219
+ }
220
+ ],
221
+ "logging_steps": 50,
222
+ "max_steps": 1314,
223
+ "num_input_tokens_seen": 0,
224
+ "num_train_epochs": 3,
225
+ "save_steps": 500,
226
+ "stateful_callbacks": {
227
+ "TrainerControl": {
228
+ "args": {
229
+ "should_epoch_stop": false,
230
+ "should_evaluate": false,
231
+ "should_log": false,
232
+ "should_save": true,
233
+ "should_training_stop": true
234
+ },
235
+ "attributes": {}
236
+ }
237
+ },
238
+ "total_flos": 1.626679997171712e+18,
239
+ "train_batch_size": 16,
240
+ "trial_name": null,
241
+ "trial_params": null
242
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21e3ab9073c6fce128dd434fb3b9b5ac50875b385a6cdc19b22dc10901a6b90a
3
+ size 5304