jialicheng committed on
Commit
ddb8dab
·
verified ·
1 Parent(s): 588b6bd

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,69 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: cc-by-nc-4.0
3
+ base_model: MCG-NJU/videomae-large
4
+ tags:
5
+ - video-classification
6
+ - generated_from_trainer
7
+ metrics:
8
+ - accuracy
9
+ model-index:
10
+ - name: ucf101_42
11
+ results: []
12
+ ---
13
+
14
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
15
+ should probably proofread and complete it, then remove this comment. -->
16
+
17
+ # ucf101_42
18
+
19
+ This model is a fine-tuned version of [MCG-NJU/videomae-large](https://huggingface.co/MCG-NJU/videomae-large) on the ucf101 dataset.
20
+ It achieves the following results on the evaluation set:
21
+ - Loss: 0.3300
22
+ - Accuracy: 0.9256
23
+ - Test Accuracy: 0.9256
24
+ - Df Accuracy: 0.9239
25
+ - Unlearn Overall Accuracy: 0.5009
26
+ - Unlearn Time: 12868.6803
27
+
28
+ ## Model description
29
+
30
+ More information needed
31
+
32
+ ## Intended uses & limitations
33
+
34
+ More information needed
35
+
36
+ ## Training and evaluation data
37
+
38
+ More information needed
39
+
40
+ ## Training procedure
41
+
42
+ ### Training hyperparameters
43
+
44
+ The following hyperparameters were used during training:
45
+ - learning_rate: 5e-05
46
+ - train_batch_size: 4
47
+ - eval_batch_size: 32
48
+ - seed: 42
49
+ - gradient_accumulation_steps: 8
50
+ - total_train_batch_size: 32
51
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
52
+ - lr_scheduler_type: linear
53
+ - num_epochs: 3
54
+
55
+ ### Training results
56
+
57
+ | Training Loss | Epoch | Step | Validation Loss | Df Accuracy | Overall Accuracy | Unlearn Overall Accuracy | Unlearn Time |
58
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:----------------:|:------------------------:|:----:|
59
+ | No log | 1.0 | 298 | 0.5062 | 0.9423 | 0.4680 | 0.4680 | -1 |
60
+ | No log | 2.0 | 596 | 0.3504 | 0.9423 | 0.4892 | 0.4892 | -1 |
61
+ | No log | 3.0 | 894 | 0.3300 | 0.9239 | 0.5009 | 0.5009 | -1 |
62
+
63
+
64
+ ### Framework versions
65
+
66
+ - Transformers 4.39.3
67
+ - Pytorch 2.2.2+cu118
68
+ - Datasets 2.18.0
69
+ - Tokenizers 0.15.2
all_results.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "df_accuracy": 0.9238754325259516,
3
+ "epoch": 3.0,
4
+ "eval_accuracy": 0.9255813953488372,
5
+ "eval_loss": 0.32996666431427,
6
+ "eval_runtime": 1084.2278,
7
+ "eval_samples_per_second": 3.489,
8
+ "eval_steps_per_second": 0.11,
9
+ "eval_unlearn_overall_accuracy": 0.5008529814114429,
10
+ "ood_accuracy": 0.28085263222556667,
11
+ "ood_loss": 3.7067184448242188,
12
+ "ood_runtime": 1654.1823,
13
+ "ood_samples_per_second": 2.823,
14
+ "ood_steps_per_second": 0.044,
15
+ "test_accuracy": 0.9255813953488372,
16
+ "train_accuracy": 0.9960578186596584,
17
+ "train_loss": 0.05140041187405586,
18
+ "train_runtime": 158.7372,
19
+ "train_samples_per_second": 3.818,
20
+ "train_steps_per_second": 0.12,
21
+ "unlearn_overall_accuracy": 0.5008529814114429,
22
+ "unlearn_time": 12868.680254936218
23
+ }
config.json ADDED
@@ -0,0 +1,237 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "./video/train/checkpoint/videomae-large/ucf101_42",
3
+ "architectures": [
4
+ "VideoMAEForVideoClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "decoder_hidden_size": 512,
8
+ "decoder_intermediate_size": 2048,
9
+ "decoder_num_attention_heads": 8,
10
+ "decoder_num_hidden_layers": 12,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.0,
13
+ "hidden_size": 1024,
14
+ "id2label": {
15
+ "0": "ApplyEyeMakeup",
16
+ "1": "ApplyLipstick",
17
+ "2": "Archery",
18
+ "3": "BabyCrawling",
19
+ "4": "BalanceBeam",
20
+ "5": "BandMarching",
21
+ "6": "BaseballPitch",
22
+ "7": "Basketball",
23
+ "8": "BasketballDunk",
24
+ "9": "BenchPress",
25
+ "10": "Biking",
26
+ "11": "Billiards",
27
+ "12": "BlowDryHair",
28
+ "13": "BlowingCandles",
29
+ "14": "BodyWeightSquats",
30
+ "15": "Bowling",
31
+ "16": "BoxingPunchingBag",
32
+ "17": "BoxingSpeedBag",
33
+ "18": "BreastStroke",
34
+ "19": "BrushingTeeth",
35
+ "20": "CleanAndJerk",
36
+ "21": "CliffDiving",
37
+ "22": "CricketBowling",
38
+ "23": "CricketShot",
39
+ "24": "CuttingInKitchen",
40
+ "25": "Diving",
41
+ "26": "Drumming",
42
+ "27": "Fencing",
43
+ "28": "FieldHockeyPenalty",
44
+ "29": "FloorGymnastics",
45
+ "30": "FrisbeeCatch",
46
+ "31": "FrontCrawl",
47
+ "32": "GolfSwing",
48
+ "33": "Haircut",
49
+ "34": "Hammering",
50
+ "35": "HammerThrow",
51
+ "36": "HandstandPushups",
52
+ "37": "HandstandWalking",
53
+ "38": "HeadMassage",
54
+ "39": "HighJump",
55
+ "40": "HorseRace",
56
+ "41": "HorseRiding",
57
+ "42": "HulaHoop",
58
+ "43": "IceDancing",
59
+ "44": "JavelinThrow",
60
+ "45": "JugglingBalls",
61
+ "46": "JumpingJack",
62
+ "47": "JumpRope",
63
+ "48": "Kayaking",
64
+ "49": "Knitting",
65
+ "50": "LongJump",
66
+ "51": "Lunges",
67
+ "52": "MilitaryParade",
68
+ "53": "Mixing",
69
+ "54": "MoppingFloor",
70
+ "55": "Nunchucks",
71
+ "56": "ParallelBars",
72
+ "57": "PizzaTossing",
73
+ "58": "PlayingCello",
74
+ "59": "PlayingDaf",
75
+ "60": "PlayingDhol",
76
+ "61": "PlayingFlute",
77
+ "62": "PlayingGuitar",
78
+ "63": "PlayingPiano",
79
+ "64": "PlayingSitar",
80
+ "65": "PlayingTabla",
81
+ "66": "PlayingViolin",
82
+ "67": "PoleVault",
83
+ "68": "PommelHorse",
84
+ "69": "PullUps",
85
+ "70": "Punch",
86
+ "71": "PushUps",
87
+ "72": "Rafting",
88
+ "73": "RockClimbingIndoor",
89
+ "74": "RopeClimbing",
90
+ "75": "Rowing",
91
+ "76": "SalsaSpin",
92
+ "77": "ShavingBeard",
93
+ "78": "Shotput",
94
+ "79": "SkateBoarding",
95
+ "80": "Skiing",
96
+ "81": "Skijet",
97
+ "82": "SkyDiving",
98
+ "83": "SoccerJuggling",
99
+ "84": "SoccerPenalty",
100
+ "85": "StillRings",
101
+ "86": "SumoWrestling",
102
+ "87": "Surfing",
103
+ "88": "Swing",
104
+ "89": "TableTennisShot",
105
+ "90": "TaiChi",
106
+ "91": "TennisSwing",
107
+ "92": "ThrowDiscus",
108
+ "93": "TrampolineJumping",
109
+ "94": "Typing",
110
+ "95": "UnevenBars",
111
+ "96": "VolleyballSpiking",
112
+ "97": "WalkingWithDog",
113
+ "98": "WallPushups",
114
+ "99": "WritingOnBoard",
115
+ "100": "YoYo"
116
+ },
117
+ "image_size": 224,
118
+ "initializer_range": 0.02,
119
+ "intermediate_size": 4096,
120
+ "label2id": {
121
+ "ApplyEyeMakeup": 0,
122
+ "ApplyLipstick": 1,
123
+ "Archery": 2,
124
+ "BabyCrawling": 3,
125
+ "BalanceBeam": 4,
126
+ "BandMarching": 5,
127
+ "BaseballPitch": 6,
128
+ "Basketball": 7,
129
+ "BasketballDunk": 8,
130
+ "BenchPress": 9,
131
+ "Biking": 10,
132
+ "Billiards": 11,
133
+ "BlowDryHair": 12,
134
+ "BlowingCandles": 13,
135
+ "BodyWeightSquats": 14,
136
+ "Bowling": 15,
137
+ "BoxingPunchingBag": 16,
138
+ "BoxingSpeedBag": 17,
139
+ "BreastStroke": 18,
140
+ "BrushingTeeth": 19,
141
+ "CleanAndJerk": 20,
142
+ "CliffDiving": 21,
143
+ "CricketBowling": 22,
144
+ "CricketShot": 23,
145
+ "CuttingInKitchen": 24,
146
+ "Diving": 25,
147
+ "Drumming": 26,
148
+ "Fencing": 27,
149
+ "FieldHockeyPenalty": 28,
150
+ "FloorGymnastics": 29,
151
+ "FrisbeeCatch": 30,
152
+ "FrontCrawl": 31,
153
+ "GolfSwing": 32,
154
+ "Haircut": 33,
155
+ "HammerThrow": 35,
156
+ "Hammering": 34,
157
+ "HandstandPushups": 36,
158
+ "HandstandWalking": 37,
159
+ "HeadMassage": 38,
160
+ "HighJump": 39,
161
+ "HorseRace": 40,
162
+ "HorseRiding": 41,
163
+ "HulaHoop": 42,
164
+ "IceDancing": 43,
165
+ "JavelinThrow": 44,
166
+ "JugglingBalls": 45,
167
+ "JumpRope": 47,
168
+ "JumpingJack": 46,
169
+ "Kayaking": 48,
170
+ "Knitting": 49,
171
+ "LongJump": 50,
172
+ "Lunges": 51,
173
+ "MilitaryParade": 52,
174
+ "Mixing": 53,
175
+ "MoppingFloor": 54,
176
+ "Nunchucks": 55,
177
+ "ParallelBars": 56,
178
+ "PizzaTossing": 57,
179
+ "PlayingCello": 58,
180
+ "PlayingDaf": 59,
181
+ "PlayingDhol": 60,
182
+ "PlayingFlute": 61,
183
+ "PlayingGuitar": 62,
184
+ "PlayingPiano": 63,
185
+ "PlayingSitar": 64,
186
+ "PlayingTabla": 65,
187
+ "PlayingViolin": 66,
188
+ "PoleVault": 67,
189
+ "PommelHorse": 68,
190
+ "PullUps": 69,
191
+ "Punch": 70,
192
+ "PushUps": 71,
193
+ "Rafting": 72,
194
+ "RockClimbingIndoor": 73,
195
+ "RopeClimbing": 74,
196
+ "Rowing": 75,
197
+ "SalsaSpin": 76,
198
+ "ShavingBeard": 77,
199
+ "Shotput": 78,
200
+ "SkateBoarding": 79,
201
+ "Skiing": 80,
202
+ "Skijet": 81,
203
+ "SkyDiving": 82,
204
+ "SoccerJuggling": 83,
205
+ "SoccerPenalty": 84,
206
+ "StillRings": 85,
207
+ "SumoWrestling": 86,
208
+ "Surfing": 87,
209
+ "Swing": 88,
210
+ "TableTennisShot": 89,
211
+ "TaiChi": 90,
212
+ "TennisSwing": 91,
213
+ "ThrowDiscus": 92,
214
+ "TrampolineJumping": 93,
215
+ "Typing": 94,
216
+ "UnevenBars": 95,
217
+ "VolleyballSpiking": 96,
218
+ "WalkingWithDog": 97,
219
+ "WallPushups": 98,
220
+ "WritingOnBoard": 99,
221
+ "YoYo": 100
222
+ },
223
+ "layer_norm_eps": 1e-12,
224
+ "model_type": "videomae",
225
+ "norm_pix_loss": true,
226
+ "num_attention_heads": 16,
227
+ "num_channels": 3,
228
+ "num_frames": 16,
229
+ "num_hidden_layers": 24,
230
+ "patch_size": 16,
231
+ "problem_type": "single_label_classification",
232
+ "qkv_bias": true,
233
+ "torch_dtype": "float32",
234
+ "transformers_version": "4.39.3",
235
+ "tubelet_size": 2,
236
+ "use_mean_pooling": false
237
+ }
dr_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "train_accuracy": 0.9960578186596584,
4
+ "train_loss": 0.05140041187405586,
5
+ "train_runtime": 158.7372,
6
+ "train_samples_per_second": 3.818,
7
+ "train_steps_per_second": 0.12
8
+ }
eval_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "df_accuracy": 0.9238754325259516,
3
+ "epoch": 3.0,
4
+ "eval_accuracy": 0.9255813953488372,
5
+ "eval_loss": 0.32996666431427,
6
+ "eval_runtime": 1084.2278,
7
+ "eval_samples_per_second": 3.489,
8
+ "eval_steps_per_second": 0.11,
9
+ "eval_unlearn_overall_accuracy": 0.5008529814114429,
10
+ "test_accuracy": 0.9255813953488372,
11
+ "unlearn_overall_accuracy": 0.5008529814114429,
12
+ "unlearn_time": 12868.680254936218
13
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e28fa715846af8f54a286a432fb53664578d563b9d871b17573c04f41424cb59
3
+ size 1215902164
ood_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "ood_accuracy": 0.28085263222556667,
3
+ "ood_loss": 3.7067184448242188,
4
+ "ood_runtime": 1654.1823,
5
+ "ood_samples_per_second": 2.823,
6
+ "ood_steps_per_second": 0.044
7
+ }
pred_logit_df.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:437dabd7b3d1e5132ae41f3e2bf1d15699750218d78212f58d96f1afa6c6e458
3
+ size 700664
pred_logit_eval.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0bd9ff9c8134d80220e37ae34198a2b1c852655a036f2d643cd16e31899f219
3
+ size 4343128
pred_logit_ood.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3150d21dfe8b68a14e9d7f59450fbbf41220f980bb841d9d00d6e975b3090174
3
+ size 6576844
pred_logit_train.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf0eb0a47dfaf92d337dba5f989bcc2deeac6cfea8ed7f17eb9aec09863a9728
3
+ size 615016
preprocessor_config.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_valid_processor_keys": [
3
+ "videos",
4
+ "do_resize",
5
+ "size",
6
+ "resample",
7
+ "do_center_crop",
8
+ "crop_size",
9
+ "do_rescale",
10
+ "rescale_factor",
11
+ "do_normalize",
12
+ "image_mean",
13
+ "image_std",
14
+ "return_tensors",
15
+ "data_format",
16
+ "input_data_format"
17
+ ],
18
+ "crop_size": {
19
+ "height": 224,
20
+ "width": 224
21
+ },
22
+ "do_center_crop": true,
23
+ "do_normalize": true,
24
+ "do_rescale": true,
25
+ "do_resize": true,
26
+ "image_mean": [
27
+ 0.485,
28
+ 0.456,
29
+ 0.406
30
+ ],
31
+ "image_processor_type": "VideoMAEImageProcessor",
32
+ "image_std": [
33
+ 0.229,
34
+ 0.224,
35
+ 0.225
36
+ ],
37
+ "resample": 2,
38
+ "rescale_factor": 0.00392156862745098,
39
+ "size": {
40
+ "shortest_edge": 224
41
+ }
42
+ }
test_results.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "df_accuracy": 0.9238754325259516,
3
+ "epoch": 3.0,
4
+ "eval_accuracy": 0.9255813953488372,
5
+ "eval_loss": 0.32996666431427,
6
+ "eval_runtime": 1084.2278,
7
+ "eval_samples_per_second": 3.489,
8
+ "eval_steps_per_second": 0.11,
9
+ "eval_unlearn_overall_accuracy": 0.5008529814114429,
10
+ "test_accuracy": 0.9255813953488372,
11
+ "unlearn_overall_accuracy": 0.5008529814114429,
12
+ "unlearn_time": 12868.680254936218
13
+ }
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "train_loss": 0.3672076743721162,
4
+ "train_runtime": 12868.4593,
5
+ "train_samples_per_second": 2.223,
6
+ "train_steps_per_second": 0.069
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5008529814114429,
3
+ "best_model_checkpoint": "video/unlearn/checkpoint/videomae-large/random_label/6.0/ucf101_42/checkpoint-894",
4
+ "epoch": 2.99874213836478,
5
+ "eval_steps": 500,
6
+ "global_step": 894,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "df_accuracy": 0.9423298731257209,
13
+ "epoch": 1.0,
14
+ "eval_accuracy": 0.8782325581395349,
15
+ "eval_loss": 0.5061985850334167,
16
+ "eval_runtime": 1143.4036,
17
+ "eval_samples_per_second": 3.309,
18
+ "eval_steps_per_second": 0.104,
19
+ "eval_unlearn_overall_accuracy": 0.467951342506907,
20
+ "step": 298,
21
+ "test_accuracy": 0.8782325581395349,
22
+ "unlearn_overall_accuracy": 0.467951342506907,
23
+ "unlearn_time": -1
24
+ },
25
+ {
26
+ "df_accuracy": 0.9423298731257209,
27
+ "epoch": 2.0,
28
+ "eval_accuracy": 0.9206511627906977,
29
+ "eval_loss": 0.3504374623298645,
30
+ "eval_runtime": 1085.58,
31
+ "eval_samples_per_second": 3.485,
32
+ "eval_steps_per_second": 0.11,
33
+ "eval_unlearn_overall_accuracy": 0.4891606448324884,
34
+ "step": 596,
35
+ "test_accuracy": 0.9206511627906977,
36
+ "unlearn_overall_accuracy": 0.4891606448324884,
37
+ "unlearn_time": -1
38
+ },
39
+ {
40
+ "df_accuracy": 0.9238754325259516,
41
+ "epoch": 3.0,
42
+ "eval_accuracy": 0.9255813953488372,
43
+ "eval_loss": 0.32996666431427,
44
+ "eval_runtime": 1087.6553,
45
+ "eval_samples_per_second": 3.478,
46
+ "eval_steps_per_second": 0.109,
47
+ "eval_unlearn_overall_accuracy": 0.5008529814114429,
48
+ "step": 894,
49
+ "test_accuracy": 0.9255813953488372,
50
+ "unlearn_overall_accuracy": 0.5008529814114429,
51
+ "unlearn_time": -1
52
+ },
53
+ {
54
+ "epoch": 3.0,
55
+ "step": 894,
56
+ "total_flos": 1.2563407617283857e+20,
57
+ "train_loss": 0.3672076743721162,
58
+ "train_runtime": 12868.4593,
59
+ "train_samples_per_second": 2.223,
60
+ "train_steps_per_second": 0.069
61
+ }
62
+ ],
63
+ "logging_steps": 1000,
64
+ "max_steps": 894,
65
+ "num_input_tokens_seen": 0,
66
+ "num_train_epochs": 3,
67
+ "save_steps": 500,
68
+ "total_flos": 1.2563407617283857e+20,
69
+ "train_batch_size": 4,
70
+ "trial_name": null,
71
+ "trial_params": null
72
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c3c0cb0ddd081f69db27f9d937e6c95606568e748f49f9b96dc3904edd5f392
3
+ size 5112