manh6054 committed on
Commit
6c394ec
·
verified ·
1 Parent(s): c3b7049

Upload 160 files

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. ava/CBAM/config.yaml +370 -0
  2. ava/CBAM/ema_epoch_1.pth +3 -0
  3. ava/CBAM/ema_epoch_2.pth +3 -0
  4. ava/CBAM/ema_epoch_3.pth +3 -0
  5. ava/CBAM/ema_epoch_4.pth +3 -0
  6. ava/CBAM/ema_epoch_5.pth +3 -0
  7. ava/CBAM/ema_epoch_6.pth +3 -0
  8. ava/CBAM/ema_epoch_7.pth +3 -0
  9. ava/CBAM/ema_epoch_8.pth +3 -0
  10. ava/CBAM/ema_epoch_9.pth +3 -0
  11. ava/CBAM/epoch_1.pth +3 -0
  12. ava/CBAM/epoch_2.pth +3 -0
  13. ava/CBAM/epoch_3.pth +3 -0
  14. ava/CBAM/epoch_4.pth +3 -0
  15. ava/CBAM/epoch_5.pth +3 -0
  16. ava/CBAM/epoch_6.pth +3 -0
  17. ava/CBAM/epoch_7.pth +3 -0
  18. ava/CBAM/epoch_8.pth +3 -0
  19. ava/CBAM/epoch_9.pth +3 -0
  20. ava/CBAM/logging.txt +1 -0
  21. ava/Channel/config.yaml +381 -0
  22. ava/Channel/ema_epoch_1.pth +3 -0
  23. ava/Channel/ema_epoch_2.pth +3 -0
  24. ava/Channel/ema_epoch_3.pth +3 -0
  25. ava/Channel/ema_epoch_4.pth +3 -0
  26. ava/Channel/ema_epoch_5.pth +3 -0
  27. ava/Channel/ema_epoch_6.pth +3 -0
  28. ava/Channel/ema_epoch_7.pth +3 -0
  29. ava/Channel/ema_epoch_8.pth +3 -0
  30. ava/Channel/ema_epoch_9.pth +3 -0
  31. ava/Channel/epoch_1.pth +3 -0
  32. ava/Channel/epoch_2.pth +3 -0
  33. ava/Channel/epoch_3.pth +3 -0
  34. ava/Channel/epoch_4.pth +3 -0
  35. ava/Channel/epoch_5.pth +3 -0
  36. ava/Channel/epoch_6.pth +3 -0
  37. ava/Channel/epoch_7.pth +3 -0
  38. ava/Channel/epoch_8.pth +3 -0
  39. ava/Channel/epoch_9.pth +3 -0
  40. ava/Channel/logging.txt +1 -0
  41. ava/LKA/config.yaml +381 -0
  42. ava/LKA/ema_epoch_1.pth +3 -0
  43. ava/LKA/ema_epoch_2.pth +3 -0
  44. ava/LKA/ema_epoch_3.pth +3 -0
  45. ava/LKA/ema_epoch_4.pth +3 -0
  46. ava/LKA/ema_epoch_5.pth +3 -0
  47. ava/LKA/ema_epoch_6.pth +3 -0
  48. ava/LKA/ema_epoch_7.pth +3 -0
  49. ava/LKA/ema_epoch_8.pth +3 -0
  50. ava/LKA/ema_epoch_9.pth +3 -0
ava/CBAM/config.yaml ADDED
@@ -0,0 +1,370 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BACKBONE2D:
2
+ YOLOv8:
3
+ ver : m
4
+
5
+ PRETRAIN:
6
+ n : weights/backbone2D/YOLOv8/v8_n.pth
7
+ s : weights/backbone2D/YOLOv8/v8_s.pth
8
+ m : weights/backbone2D/YOLOv8/v8_m.pth
9
+ l : weights/backbone2D/YOLOv8/v8_l.pth
10
+ x : weights/backbone2D/YOLOv8/v8_x.pth
11
+
12
+ BACKBONE3D:
13
+
14
+ MOBILENET:
15
+ width_mult: 2.0
16
+
17
+ PRETRAIN:
18
+ width_mult_0.5x : weights/backbone3D/mobilenet/kinetics_mobilenet_0.5x_RGB_16_best.pth
19
+ width_mult_1.0x : weights/backbone3D/mobilenet/kinetics_mobilenet_1.0x_RGB_16_best.pth
20
+ width_mult_1.5x : weights/backbone3D/mobilenet/kinetics_mobilenet_1.5x_RGB_16_best.pth
21
+ width_mult_2.0x : weights/backbone3D/mobilenet/kinetics_mobilenet_2.0x_RGB_16_best.pth
22
+
23
+ MOBILENETv2:
24
+ width_mult: 1.0
25
+
26
+ PRETRAIN:
27
+ width_mult_0.2x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.2x_RGB_16_best.pth
28
+ width_mult_0.45x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.45x_RGB_16_best.pth
29
+ width_mult_0.7x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.7x_RGB_16_best.pth
30
+ width_mult_1.0x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_1.0x_RGB_16_best.pth
31
+
32
+ SHUFFLENET:
33
+ width_mult: 2.0
34
+
35
+ PRETRAIN:
36
+ width_mult_0.5x : weights/backbone3D/shufflenet/kinetics_shufflenet_0.5x_G3_RGB_16_best.pth
37
+ width_mult_1.0x : weights/backbone3D/shufflenet/kinetics_shufflenet_1.0x_G3_RGB_16_best.pth
38
+ width_mult_1.5x : weights/backbone3D/shufflenet/kinetics_shufflenet_1.5x_G3_RGB_16_best.pth
39
+ width_mult_2.0x : weights/backbone3D/shufflenet/kinetics_shufflenet_2.0x_G3_RGB_16_best.pth
40
+
41
+ SHUFFLENETv2:
42
+ width_mult: 2.0
43
+
44
+ PRETRAIN:
45
+ width_mult_0.25x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_0.25x_RGB_16_best.pth
46
+ width_mult_1.0x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_1.0x_RGB_16_best.pth
47
+ width_mult_1.5x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_1.5x_RGB_16_best.pth
48
+ width_mult_2.0x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_2.0x_RGB_16_best.pth
49
+
50
+ I3D:
51
+ PRETRAIN:
52
+ default: weights/backbone3D/I3D/rgb_imagenet.pth
53
+
54
+ RESNET:
55
+ ver : 101
56
+
57
+ PRETRAIN:
58
+ ver_18 : weights/backbone3D/resnet/kinetics_resnet_18_RGB_16_best.pth
59
+ ver_50 : weights/backbone3D/resnet/kinetics_resnet_50_RGB_16_best.pth
60
+ ver_101: weights/backbone3D/resnet/kinetics_resnet_101_RGB_16_best.pth
61
+
62
+ RESNEXT:
63
+ ver : 101
64
+
65
+ PRETRAIN:
66
+ ver_101 : weights/backbone3D/resnext/resnext-101-kinetics.pth
67
+
68
+ LOSS:
69
+ TAL:
70
+ top_k : 10
71
+ alpha : 0.5
72
+ beta : 6.0
73
+ radius : 2.5
74
+ soft_label : False
75
+
76
+ scale_cls_loss : 0.5
77
+ scale_box_loss : 7.5
78
+ scale_dfl_loss : 1.5
79
+
80
+ SIMOTA:
81
+ top_k : 10
82
+ gamma : 0.5
83
+ radius : 2.5
84
+ mode : unbalance
85
+ soft_label : True
86
+
87
+ dynamic_k : False
88
+ dynamic_top_k : 10
89
+
90
+ scale_cls_loss : 0.5
91
+ scale_box_loss : 5.0
92
+ scale_dfl_loss : 0.5
93
+
94
+ config_path : config/cf/ava.yaml
95
+ dataset : ava
96
+ loss : simota
97
+ active_checker : True
98
+ num_classes : 80
99
+ backbone2D : yolov8
100
+ backbone3D : i3d
101
+ fusion_module : CBAM
102
+ mode : decoupled
103
+ interchannels : [256, 256, 256]
104
+ pretrain_path : weights/fig1/ava/CBAM/ema_epoch_8.pth
105
+ data_root : /home/manh/Datasets/ava
106
+ img_size : 224
107
+ clip_length : 16
108
+ batch_size : 8
109
+ num_workers : 6
110
+ acc_grad : 16
111
+ lr : 0.0001
112
+ weight_decay : 0.0005
113
+ max_step_warmup : 500
114
+ adjustlr_schedule : [3, 4, 5, 6]
115
+ max_epoch : 9
116
+ lr_decay : 0.5
117
+ save_folder : weights/fig1/ava/CBAM
118
+ sampling_rate : 1
119
+ labelmap : evaluator/Evaluation/ava_action_list_v2.2_for_activitynet_2019.pbtxt
120
+ groundtruth : evaluator/Evaluation/ava_val_v2.2.csv
121
+ detections : ava_result/ava_predicted_file.csv
122
+
123
+
124
+ idx2name:
125
+ 0 : bend/bow (at the waist)
126
+ 1 : crawl
127
+ 2 : crouch/kneel
128
+ 3 : dance
129
+ 4 : fall down
130
+ 5 : get up
131
+ 6 : jump/leap
132
+ 7 : lie/sleep
133
+ 8 : martial art
134
+ 9 : run/jog
135
+ 10 : sit
136
+ 11 : stand
137
+ 12 : swim
138
+ 13 : walk
139
+ 14 : answer phone
140
+ 15 : brush teeth
141
+ 16 : carry/hold (an object)
142
+ 17 : catch (an object)
143
+ 18 : chop
144
+ 19 : climb (e.g., a mountain)
145
+ 20 : clink glass
146
+ 21 : close (e.g., a door, a box)
147
+ 22 : cook
148
+ 23 : cut
149
+ 24 : dig
150
+ 25 : dress/put on clothing
151
+ 26 : drink
152
+ 27 : drive (e.g., a car, a truck)
153
+ 28 : eat
154
+ 29 : enter
155
+ 30 : exit
156
+ 31 : extract
157
+ 32 : fishing
158
+ 33 : hit (an object)
159
+ 34 : kick (an object)
160
+ 35 : lift/pick up
161
+ 36 : listen (e.g., to music)
162
+ 37 : open (e.g., a window, a car door)
163
+ 38 : paint
164
+ 39 : play board game
165
+ 40 : play musical instrument
166
+ 41 : play with pets
167
+ 42 : point to (an object)
168
+ 43 : press
169
+ 44 : pull (an object)
170
+ 45 : push (an object)
171
+ 46 : put down
172
+ 47 : read
173
+ 48 : ride (e.g., a bike, a car, a horse)
174
+ 49 : row boat
175
+ 50 : sail boat
176
+ 51 : shoot
177
+ 52 : shovel
178
+ 53 : smoke
179
+ 54 : stir
180
+ 55 : take a photo
181
+ 56 : text on/look at a cellphone
182
+ 57 : throw
183
+ 58 : touch (an object)
184
+ 59 : turn (e.g., a screwdriver)
185
+ 60 : watch (e.g., TV)
186
+ 61 : work on a computer
187
+ 62 : write
188
+ 63 : fight/hit (a person)
189
+ 64 : give/serve (an object) to (a person)
190
+ 65 : grab (a person)
191
+ 66 : hand clap
192
+ 67 : hand shake
193
+ 68 : hand wave
194
+ 69 : hug (a person)
195
+ 70 : kick (a person)
196
+ 71 : kiss (a person)
197
+ 72 : lift (a person)
198
+ 73 : listen to (a person)
199
+ 74 : play with kids
200
+ 75 : push (another person)
201
+ 76 : sing to (e.g., self, a person, a group)
202
+ 77 : take (an object) from (a person)
203
+ 78 : talk to (e.g., self, a person, a group)
204
+ 79 : watch (a person)
205
+
206
+
207
+ train_class_count:
208
+ 0 : 8322
209
+ 1 : 157
210
+ 2 : 2309
211
+ 3 : 3239
212
+ 4 : 291
213
+ 5 : 1120
214
+ 6 : 245
215
+ 7 : 5349
216
+ 8 : 2102
217
+ 9 : 3308
218
+ 10 : 99884
219
+ 11 : 165387
220
+ 12 : 110
221
+ 13 : 40341
222
+ 14 : 3275
223
+ 15 : 20
224
+ 16 : 80025
225
+ 17 : 80
226
+ 18 : 36
227
+ 19 : 267
228
+ 20 : 53
229
+ 21 : 784
230
+ 22 : 65
231
+ 23 : 184
232
+ 24 : 41
233
+ 25 : 342
234
+ 26 : 2319
235
+ 27 : 1187
236
+ 28 : 3012
237
+ 29 : 221
238
+ 30 : 53
239
+ 31 : 7
240
+ 32 : 79
241
+ 33 : 177
242
+ 34 : 35
243
+ 35 : 518
244
+ 36 : 660
245
+ 37 : 1247
246
+ 38 : 67
247
+ 39 : 117
248
+ 40 : 1290
249
+ 41 : 138
250
+ 42 : 97
251
+ 43 : 94
252
+ 44 : 341
253
+ 45 : 385
254
+ 46 : 533
255
+ 47 : 2141
256
+ 48 : 4784
257
+ 49 : 62
258
+ 50 : 712
259
+ 51 : 219
260
+ 52 : 67
261
+ 53 : 2986
262
+ 54 : 59
263
+ 55 : 180
264
+ 56 : 415
265
+ 57 : 248
266
+ 58 : 17077
267
+ 59 : 135
268
+ 60 : 1983
269
+ 61 : 176
270
+ 62 : 773
271
+ 63 : 2691
272
+ 64 : 1073
273
+ 65 : 1993
274
+ 66 : 1175
275
+ 67 : 619
276
+ 68 : 343
277
+ 69 : 1101
278
+ 70 : 50
279
+ 71 : 714
280
+ 72 : 400
281
+ 73 : 106175
282
+ 74 : 127
283
+ 75 : 355
284
+ 76 : 1638
285
+ 77 : 608
286
+ 78 : 110151
287
+ 79 : 167115
288
+
289
+
290
+ class_ratio:
291
+ 79: 0.5059319458527529
292
+ 11: 0.5005430972490094
293
+ 78: 0.3317767554377424
294
+ 73: 0.32139321745252786
295
+ 10: 0.3018567607333167
296
+ 16: 0.24206491290886498
297
+ 13: 0.12267378359756043
298
+ 58: 0.05155061034502472
299
+ 0: 0.02512088050957867
300
+ 7: 0.016115395377806128
301
+ 48: 0.014466546112115732
302
+ 9: 0.010040529196366514
303
+ 14: 0.00986601595291753
304
+ 3: 0.00982990976461774
305
+ 28: 0.009101768300571982
306
+ 53: 0.008999467433722578
307
+ 63: 0.008108848122327766
308
+ 26: 0.007025662473334075
309
+ 2: 0.006983538586984321
310
+ 47: 0.006456990007612388
311
+ 8: 0.006369733385887896
312
+ 65: 0.006026724597039895
313
+ 60: 0.0059966361067900695
314
+ 76: 0.004943538948046204
315
+ 40: 0.003902477185402268
316
+ 37: 0.0037640701302530744
317
+ 27: 0.0035745126416791783
318
+ 66: 0.003571503792654196
319
+ 5: 0.0033819463040803003
320
+ 69: 0.0033187604745556682
321
+ 64: 0.003228495003806194
322
+ 21: 0.0023649553336362243
323
+ 62: 0.002337875692411382
324
+ 50: 0.0021633624489623983
325
+ 71: 0.002148318203837486
326
+ 36: 0.0020099111486882922
327
+ 67: 0.001862477546464151
328
+ 77: 0.0018293802071893438
329
+ 46: 0.0016037165303156584
330
+ 35: 0.0015615926439659037
331
+ 56: 0.0012486723453677265
332
+ 72: 0.0012035396099929893
333
+ 45: 0.0011644245726682172
334
+ 75: 0.0010681414038687781
335
+ 68: 0.001056106007768848
336
+ 44: 0.001035044064593971
337
+ 25: 0.001029026366544006
338
+ 4: 0.0008755750662698998
339
+ 19: 0.0008063715386953028
340
+ 57: 0.0007492034072206358
341
+ 6: 0.000737168011120706
342
+ 29: 0.0006769910306210565
343
+ 51: 0.0006679644835461091
344
+ 23: 0.0005536282205967751
345
+ 55: 0.0005446016735218277
346
+ 33: 0.0005325662774218978
347
+ 61: 0.0005295574283969153
348
+ 1: 0.0004723892969222483
349
+ 41: 0.0004152211654475813
350
+ 59: 0.00041221231642259886
351
+ 74: 0.00038212382617277413
352
+ 39: 0.00035504418494793186
353
+ 12: 0.00033398224177305457
354
+ 42: 0.00029185835542329993
355
+ 43: 0.0002828318083483525
356
+ 17: 0.00024070792199859788
357
+ 32: 0.0002376990729736154
358
+ 38: 0.0002015928846738257
359
+ 52: 0.0002015928846738257
360
+ 22: 0.00019557518662386078
361
+ 49: 0.00018654863954891334
362
+ 54: 0.00018053094149894842
363
+ 20: 0.0001594689983240711
364
+ 30: 0.0001594689983240711
365
+ 70: 0.00015044245124912366
366
+ 24: 0.00012336281002428142
367
+ 18: 0.00010831856489936904
368
+ 34: 0.00010530971587438658
369
+ 15: 6.017698049964947e-05
370
+ 31: 2.1061943174877314e-05
ava/CBAM/ema_epoch_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71977f0063b8a106fb50d86a54aa3550c505286c4963b58b1ec5b403940f6fae
3
+ size 210567010
ava/CBAM/ema_epoch_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf7252425bd33f036c82141899855258967d23b8cc923eea904d590cf735c01
3
+ size 210567010
ava/CBAM/ema_epoch_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b2722d035b78d9506344f319a1595ee00206473f4f6441ac4c79f3f6d264490
3
+ size 210567010
ava/CBAM/ema_epoch_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8b2d63e21976a4dc57ad3bc516b46c9e0c3c90804335df163546a8850b30e15
3
+ size 210567010
ava/CBAM/ema_epoch_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1f8d4d4844a0b42e325dd444c0373367fa29f551c3c354d264cc42d0bc292fd
3
+ size 210567010
ava/CBAM/ema_epoch_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef9c899553f3ffda920cc51ea42d20a3acc3bd26e8e7cd83daf3b5b843b600d4
3
+ size 210567010
ava/CBAM/ema_epoch_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6d4ad32cc23313d69c1b18b718e9fad325488a169c45044d74d71102fec4ffd
3
+ size 210567010
ava/CBAM/ema_epoch_8.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b3777e33a247e2cfce8e2751bb13a5d3a5b35552735a97a52df61e73d5e03a4
3
+ size 210567010
ava/CBAM/ema_epoch_9.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:854bea7cb7c5f077b642a75cc1b8090948139971252c3db4b060aa977cf95609
3
+ size 210567010
ava/CBAM/epoch_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41ad1cb17f3c7a15ebd7ca36fcb7f8b1dd47fe25484b91ff2297dd3e3059890f
3
+ size 210559982
ava/CBAM/epoch_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:835b626c8ed6fcc77bbc5e2004714209905a4238668dabb289160cc69c7b2ca9
3
+ size 210559982
ava/CBAM/epoch_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9261a40bcf7de7f493ea73aaa0595f64292fa83e07121bc05452eb94b4f1a4f
3
+ size 210559982
ava/CBAM/epoch_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc0e034a5dec5db2c80540a9d502284e3eaab2e90f847846e3536827ec9600c0
3
+ size 210559982
ava/CBAM/epoch_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a0b095045348de1ee0ea46ed5e0e24a7343d664782bc4f3758b0b67e42e0211
3
+ size 210559982
ava/CBAM/epoch_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00608d36a60054a2a9a5f76e74868c6be6816deb23a98cbbb0ed3126da3887e7
3
+ size 210559982
ava/CBAM/epoch_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c0df243e1ff87031c85053f97ff9a1fd2ff85f9bfa489d8f52daaccb9ed81cc
3
+ size 210559982
ava/CBAM/epoch_8.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e16156daed94476cb80e3367a41ae78005fd1dcac6024b1219340b07a48d05b7
3
+ size 210559982
ava/CBAM/epoch_9.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bcdc0e391421d29119cd86b85e6eb97257759fb379c179f75ab09e19d483fd0
3
+ size 210559982
ava/CBAM/logging.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ epoch : 9, update : 1440, loss = 3.2836099416017532
ava/Channel/config.yaml ADDED
@@ -0,0 +1,381 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BACKBONE2D:
2
+ YOLOv8:
3
+ ver : m
4
+
5
+ PRETRAIN:
6
+ n : weights/backbone2D/YOLOv8/v8_n.pth
7
+ s : weights/backbone2D/YOLOv8/v8_s.pth
8
+ m : weights/backbone2D/YOLOv8/v8_m.pth
9
+ l : weights/backbone2D/YOLOv8/v8_l.pth
10
+ x : weights/backbone2D/YOLOv8/v8_x.pth
11
+
12
+ BACKBONE3D:
13
+
14
+ MOBILENET:
15
+ width_mult: 2.0
16
+
17
+ PRETRAIN:
18
+ width_mult_0.5x : weights/backbone3D/mobilenet/kinetics_mobilenet_0.5x_RGB_16_best.pth
19
+ width_mult_1.0x : weights/backbone3D/mobilenet/kinetics_mobilenet_1.0x_RGB_16_best.pth
20
+ width_mult_1.5x : weights/backbone3D/mobilenet/kinetics_mobilenet_1.5x_RGB_16_best.pth
21
+ width_mult_2.0x : weights/backbone3D/mobilenet/kinetics_mobilenet_2.0x_RGB_16_best.pth
22
+
23
+ MOBILENETv2:
24
+ width_mult: 1.0
25
+
26
+ PRETRAIN:
27
+ width_mult_0.2x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.2x_RGB_16_best.pth
28
+ width_mult_0.45x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.45x_RGB_16_best.pth
29
+ width_mult_0.7x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.7x_RGB_16_best.pth
30
+ width_mult_1.0x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_1.0x_RGB_16_best.pth
31
+
32
+ SHUFFLENET:
33
+ width_mult: 2.0
34
+
35
+ PRETRAIN:
36
+ width_mult_0.5x : weights/backbone3D/shufflenet/kinetics_shufflenet_0.5x_G3_RGB_16_best.pth
37
+ width_mult_1.0x : weights/backbone3D/shufflenet/kinetics_shufflenet_1.0x_G3_RGB_16_best.pth
38
+ width_mult_1.5x : weights/backbone3D/shufflenet/kinetics_shufflenet_1.5x_G3_RGB_16_best.pth
39
+ width_mult_2.0x : weights/backbone3D/shufflenet/kinetics_shufflenet_2.0x_G3_RGB_16_best.pth
40
+
41
+ SHUFFLENETv2:
42
+ width_mult: 2.0
43
+
44
+ PRETRAIN:
45
+ width_mult_0.25x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_0.25x_RGB_16_best.pth
46
+ width_mult_1.0x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_1.0x_RGB_16_best.pth
47
+ width_mult_1.5x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_1.5x_RGB_16_best.pth
48
+ width_mult_2.0x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_2.0x_RGB_16_best.pth
49
+
50
+ I3D:
51
+ PRETRAIN:
52
+ default: weights/backbone3D/I3D/rgb_imagenet.pth
53
+
54
+ RESNET:
55
+ ver : 101
56
+
57
+ PRETRAIN:
58
+ ver_18 : weights/backbone3D/resnet/kinetics_resnet_18_RGB_16_best.pth
59
+ ver_50 : weights/backbone3D/resnet/kinetics_resnet_50_RGB_16_best.pth
60
+ ver_101: weights/backbone3D/resnet/kinetics_resnet_101_RGB_16_best.pth
61
+
62
+ RESNEXT:
63
+ ver : 101
64
+
65
+ PRETRAIN:
66
+ ver_101 : weights/backbone3D/resnext/resnext-101-kinetics.pth
67
+
68
+ LOSS:
69
+ TAL:
70
+ top_k : 10
71
+ alpha : 0.5
72
+ beta : 6.0
73
+ radius : 2.5
74
+ soft_label : False
75
+
76
+ scale_cls_loss : 0.5
77
+ scale_box_loss : 7.5
78
+ scale_dfl_loss : 1.5
79
+
80
+ SIMOTA:
81
+ top_k : 10
82
+ gamma : 0.5
83
+ radius : 2.5
84
+ mode : unbalance
85
+ soft_label : True
86
+
87
+ dynamic_k : False
88
+ dynamic_top_k : 10
89
+
90
+ scale_cls_loss : 0.5
91
+ scale_box_loss : 5.0
92
+ scale_dfl_loss : 0.5
93
+
94
+ NORMAL:
95
+ top_k : 10
96
+ radius : 2.5
97
+
98
+ dynamic_k : True
99
+ dynamic_top_k : 10
100
+
101
+ scale_cls_loss : 1.0
102
+ scale_box_loss : 5.0
103
+ scale_dfl_loss : 1.0
104
+
105
+ config_path : config/cf/ava.yaml
106
+ dataset : ava
107
+ loss : simota
108
+ active_checker : True
109
+ num_classes : 80
110
+ backbone2D : yolov8
111
+ backbone3D : i3d
112
+ fusion_module : Channel
113
+ mode : decoupled
114
+ interchannels : [256, 256, 256]
115
+ pretrain_path : weights/fig1/ava/Channel/ema_epoch_9.pth
116
+ data_root : /home/manh/Datasets/ava
117
+ img_size : 224
118
+ clip_length : 16
119
+ batch_size : 8
120
+ num_workers : 6
121
+ acc_grad : 16
122
+ lr : 0.0001
123
+ weight_decay : 0.0005
124
+ max_step_warmup : 500
125
+ adjustlr_schedule : [3, 4, 5, 6]
126
+ max_epoch : 9
127
+ lr_decay : 0.5
128
+ save_folder : weights/fig1/ava/Channel
129
+ sampling_rate : 1
130
+ labelmap : evaluator/Evaluation/ava_action_list_v2.2_for_activitynet_2019.pbtxt
131
+ groundtruth : evaluator/Evaluation/ava_val_v2.2.csv
132
+ detections : ava_result/ava_predicted_file.csv
133
+
134
+
135
+ idx2name:
136
+ 0 : bend/bow (at the waist)
137
+ 1 : crawl
138
+ 2 : crouch/kneel
139
+ 3 : dance
140
+ 4 : fall down
141
+ 5 : get up
142
+ 6 : jump/leap
143
+ 7 : lie/sleep
144
+ 8 : martial art
145
+ 9 : run/jog
146
+ 10 : sit
147
+ 11 : stand
148
+ 12 : swim
149
+ 13 : walk
150
+ 14 : answer phone
151
+ 15 : brush teeth
152
+ 16 : carry/hold (an object)
153
+ 17 : catch (an object)
154
+ 18 : chop
155
+ 19 : climb (e.g., a mountain)
156
+ 20 : clink glass
157
+ 21 : close (e.g., a door, a box)
158
+ 22 : cook
159
+ 23 : cut
160
+ 24 : dig
161
+ 25 : dress/put on clothing
162
+ 26 : drink
163
+ 27 : drive (e.g., a car, a truck)
164
+ 28 : eat
165
+ 29 : enter
166
+ 30 : exit
167
+ 31 : extract
168
+ 32 : fishing
169
+ 33 : hit (an object)
170
+ 34 : kick (an object)
171
+ 35 : lift/pick up
172
+ 36 : listen (e.g., to music)
173
+ 37 : open (e.g., a window, a car door)
174
+ 38 : paint
175
+ 39 : play board game
176
+ 40 : play musical instrument
177
+ 41 : play with pets
178
+ 42 : point to (an object)
179
+ 43 : press
180
+ 44 : pull (an object)
181
+ 45 : push (an object)
182
+ 46 : put down
183
+ 47 : read
184
+ 48 : ride (e.g., a bike, a car, a horse)
185
+ 49 : row boat
186
+ 50 : sail boat
187
+ 51 : shoot
188
+ 52 : shovel
189
+ 53 : smoke
190
+ 54 : stir
191
+ 55 : take a photo
192
+ 56 : text on/look at a cellphone
193
+ 57 : throw
194
+ 58 : touch (an object)
195
+ 59 : turn (e.g., a screwdriver)
196
+ 60 : watch (e.g., TV)
197
+ 61 : work on a computer
198
+ 62 : write
199
+ 63 : fight/hit (a person)
200
+ 64 : give/serve (an object) to (a person)
201
+ 65 : grab (a person)
202
+ 66 : hand clap
203
+ 67 : hand shake
204
+ 68 : hand wave
205
+ 69 : hug (a person)
206
+ 70 : kick (a person)
207
+ 71 : kiss (a person)
208
+ 72 : lift (a person)
209
+ 73 : listen to (a person)
210
+ 74 : play with kids
211
+ 75 : push (another person)
212
+ 76 : sing to (e.g., self, a person, a group)
213
+ 77 : take (an object) from (a person)
214
+ 78 : talk to (e.g., self, a person, a group)
215
+ 79 : watch (a person)
216
+
217
+
218
+ train_class_count:
219
+ 0 : 8322
220
+ 1 : 157
221
+ 2 : 2309
222
+ 3 : 3239
223
+ 4 : 291
224
+ 5 : 1120
225
+ 6 : 245
226
+ 7 : 5349
227
+ 8 : 2102
228
+ 9 : 3308
229
+ 10 : 99884
230
+ 11 : 165387
231
+ 12 : 110
232
+ 13 : 40341
233
+ 14 : 3275
234
+ 15 : 20
235
+ 16 : 80025
236
+ 17 : 80
237
+ 18 : 36
238
+ 19 : 267
239
+ 20 : 53
240
+ 21 : 784
241
+ 22 : 65
242
+ 23 : 184
243
+ 24 : 41
244
+ 25 : 342
245
+ 26 : 2319
246
+ 27 : 1187
247
+ 28 : 3012
248
+ 29 : 221
249
+ 30 : 53
250
+ 31 : 7
251
+ 32 : 79
252
+ 33 : 177
253
+ 34 : 35
254
+ 35 : 518
255
+ 36 : 660
256
+ 37 : 1247
257
+ 38 : 67
258
+ 39 : 117
259
+ 40 : 1290
260
+ 41 : 138
261
+ 42 : 97
262
+ 43 : 94
263
+ 44 : 341
264
+ 45 : 385
265
+ 46 : 533
266
+ 47 : 2141
267
+ 48 : 4784
268
+ 49 : 62
269
+ 50 : 712
270
+ 51 : 219
271
+ 52 : 67
272
+ 53 : 2986
273
+ 54 : 59
274
+ 55 : 180
275
+ 56 : 415
276
+ 57 : 248
277
+ 58 : 17077
278
+ 59 : 135
279
+ 60 : 1983
280
+ 61 : 176
281
+ 62 : 773
282
+ 63 : 2691
283
+ 64 : 1073
284
+ 65 : 1993
285
+ 66 : 1175
286
+ 67 : 619
287
+ 68 : 343
288
+ 69 : 1101
289
+ 70 : 50
290
+ 71 : 714
291
+ 72 : 400
292
+ 73 : 106175
293
+ 74 : 127
294
+ 75 : 355
295
+ 76 : 1638
296
+ 77 : 608
297
+ 78 : 110151
298
+ 79 : 167115
299
+
300
+
301
+ class_ratio:
302
+ 79: 0.5059319458527529
303
+ 11: 0.5005430972490094
304
+ 78: 0.3317767554377424
305
+ 73: 0.32139321745252786
306
+ 10: 0.3018567607333167
307
+ 16: 0.24206491290886498
308
+ 13: 0.12267378359756043
309
+ 58: 0.05155061034502472
310
+ 0: 0.02512088050957867
311
+ 7: 0.016115395377806128
312
+ 48: 0.014466546112115732
313
+ 9: 0.010040529196366514
314
+ 14: 0.00986601595291753
315
+ 3: 0.00982990976461774
316
+ 28: 0.009101768300571982
317
+ 53: 0.008999467433722578
318
+ 63: 0.008108848122327766
319
+ 26: 0.007025662473334075
320
+ 2: 0.006983538586984321
321
+ 47: 0.006456990007612388
322
+ 8: 0.006369733385887896
323
+ 65: 0.006026724597039895
324
+ 60: 0.0059966361067900695
325
+ 76: 0.004943538948046204
326
+ 40: 0.003902477185402268
327
+ 37: 0.0037640701302530744
328
+ 27: 0.0035745126416791783
329
+ 66: 0.003571503792654196
330
+ 5: 0.0033819463040803003
331
+ 69: 0.0033187604745556682
332
+ 64: 0.003228495003806194
333
+ 21: 0.0023649553336362243
334
+ 62: 0.002337875692411382
335
+ 50: 0.0021633624489623983
336
+ 71: 0.002148318203837486
337
+ 36: 0.0020099111486882922
338
+ 67: 0.001862477546464151
339
+ 77: 0.0018293802071893438
340
+ 46: 0.0016037165303156584
341
+ 35: 0.0015615926439659037
342
+ 56: 0.0012486723453677265
343
+ 72: 0.0012035396099929893
344
+ 45: 0.0011644245726682172
345
+ 75: 0.0010681414038687781
346
+ 68: 0.001056106007768848
347
+ 44: 0.001035044064593971
348
+ 25: 0.001029026366544006
349
+ 4: 0.0008755750662698998
350
+ 19: 0.0008063715386953028
351
+ 57: 0.0007492034072206358
352
+ 6: 0.000737168011120706
353
+ 29: 0.0006769910306210565
354
+ 51: 0.0006679644835461091
355
+ 23: 0.0005536282205967751
356
+ 55: 0.0005446016735218277
357
+ 33: 0.0005325662774218978
358
+ 61: 0.0005295574283969153
359
+ 1: 0.0004723892969222483
360
+ 41: 0.0004152211654475813
361
+ 59: 0.00041221231642259886
362
+ 74: 0.00038212382617277413
363
+ 39: 0.00035504418494793186
364
+ 12: 0.00033398224177305457
365
+ 42: 0.00029185835542329993
366
+ 43: 0.0002828318083483525
367
+ 17: 0.00024070792199859788
368
+ 32: 0.0002376990729736154
369
+ 38: 0.0002015928846738257
370
+ 52: 0.0002015928846738257
371
+ 22: 0.00019557518662386078
372
+ 49: 0.00018654863954891334
373
+ 54: 0.00018053094149894842
374
+ 20: 0.0001594689983240711
375
+ 30: 0.0001594689983240711
376
+ 70: 0.00015044245124912366
377
+ 24: 0.00012336281002428142
378
+ 18: 0.00010831856489936904
379
+ 34: 0.00010530971587438658
380
+ 15: 6.017698049964947e-05
381
+ 31: 2.1061943174877314e-05
ava/Channel/ema_epoch_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7be13db14b745b048d0829ec191f1960b8a1ae0b70e80b70b663b00b542323c8
3
+ size 210545426
ava/Channel/ema_epoch_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be95736677bc7145e4fa8af2c3341d71a70e87fd34d9beff31613de060ce6df4
3
+ size 210545426
ava/Channel/ema_epoch_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f94bcaa676c69b5a8bebd8fad18c5dd6a524b7940ee8803592eb82caef92f94a
3
+ size 210545426
ava/Channel/ema_epoch_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba515a2a18056ff5e5f08b2b0faad38200feca0e0ffb2c380ab29bfc8df66d7c
3
+ size 210545426
ava/Channel/ema_epoch_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4bd3b05386a4792ba0c277a8e1b7ea67494fe22494115b2cc52aa7c776c05a2
3
+ size 210545426
ava/Channel/ema_epoch_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:217b3cf6b50dcc060afcb5314d53fbf34c1681db286621e542bcbb9d79a5d63a
3
+ size 210545426
ava/Channel/ema_epoch_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee9af57ae12115d7d81814f92441a3209f15dc098b1866a9a647a93f7f778022
3
+ size 210545426
ava/Channel/ema_epoch_8.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0425702994041a42086b6080a8d17877e02e77df2a4306c23d5a2e31fc160c0b
3
+ size 210545426
ava/Channel/ema_epoch_9.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53ad5bf346d1921ab2c6c394fa557b18a2624a861fb41459868e07d1266ff78a
3
+ size 210545426
ava/Channel/epoch_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:748cd188b858db99fadf50bc57a6aee78284f1c3933aa95b2059e86e3fa921e9
3
+ size 210538590
ava/Channel/epoch_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a01fd02bac19c7fa76d6ca7cd152c09b57cc39a1c9bb4a5c103638347663bb18
3
+ size 210538590
ava/Channel/epoch_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f86e311b0dc7b9fc2be25db60c09f6a0e79c00b0f5e05a26ba49512e780a5fb8
3
+ size 210538590
ava/Channel/epoch_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:429648b9b17724aac500aee4cf47c818ab2f2bfad14d484b63bf3c4a18b5293f
3
+ size 210538590
ava/Channel/epoch_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c5da5275c3072fb2d9dcecf335aa3f60f751fde6b8b3b9dc998b0e512c21c31
3
+ size 210538590
ava/Channel/epoch_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:848e9fed6d715a43bcc39ad4bc3b35bbf854d910538519bbbf55f2402930c350
3
+ size 210538590
ava/Channel/epoch_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c33dd3be538aa398ea2187c43d9e54aac4d91626eb2a68c3282417518490ba0
3
+ size 210538590
ava/Channel/epoch_8.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d54f0513a9be70f56de871647d53d79e900fc8556c9135260ca5d49563672b7
3
+ size 210538590
ava/Channel/epoch_9.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:361292d7f5625cc5380c45a26ec7122ede15f182bd6e3aa4dddeaa9e0656eedd
3
+ size 210538590
ava/Channel/logging.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ epoch : 9, update : 1440, loss = 3.0980929285287857
ava/LKA/config.yaml ADDED
@@ -0,0 +1,381 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BACKBONE2D:
2
+ YOLOv8:
3
+ ver : m
4
+
5
+ PRETRAIN:
6
+ n : weights/backbone2D/YOLOv8/v8_n.pth
7
+ s : weights/backbone2D/YOLOv8/v8_s.pth
8
+ m : weights/backbone2D/YOLOv8/v8_m.pth
9
+ l : weights/backbone2D/YOLOv8/v8_l.pth
10
+ x : weights/backbone2D/YOLOv8/v8_x.pth
11
+
12
+ BACKBONE3D:
13
+
14
+ MOBILENET:
15
+ width_mult: 2.0
16
+
17
+ PRETRAIN:
18
+ width_mult_0.5x : weights/backbone3D/mobilenet/kinetics_mobilenet_0.5x_RGB_16_best.pth
19
+ width_mult_1.0x : weights/backbone3D/mobilenet/kinetics_mobilenet_1.0x_RGB_16_best.pth
20
+ width_mult_1.5x : weights/backbone3D/mobilenet/kinetics_mobilenet_1.5x_RGB_16_best.pth
21
+ width_mult_2.0x : weights/backbone3D/mobilenet/kinetics_mobilenet_2.0x_RGB_16_best.pth
22
+
23
+ MOBILENETv2:
24
+ width_mult: 1.0
25
+
26
+ PRETRAIN:
27
+ width_mult_0.2x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.2x_RGB_16_best.pth
28
+ width_mult_0.45x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.45x_RGB_16_best.pth
29
+ width_mult_0.7x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_0.7x_RGB_16_best.pth
30
+ width_mult_1.0x : weights/backbone3D/mobilenetv2/kinetics_mobilenetv2_1.0x_RGB_16_best.pth
31
+
32
+ SHUFFLENET:
33
+ width_mult: 2.0
34
+
35
+ PRETRAIN:
36
+ width_mult_0.5x : weights/backbone3D/shufflenet/kinetics_shufflenet_0.5x_G3_RGB_16_best.pth
37
+ width_mult_1.0x : weights/backbone3D/shufflenet/kinetics_shufflenet_1.0x_G3_RGB_16_best.pth
38
+ width_mult_1.5x : weights/backbone3D/shufflenet/kinetics_shufflenet_1.5x_G3_RGB_16_best.pth
39
+ width_mult_2.0x : weights/backbone3D/shufflenet/kinetics_shufflenet_2.0x_G3_RGB_16_best.pth
40
+
41
+ SHUFFLENETv2:
42
+ width_mult: 2.0
43
+
44
+ PRETRAIN:
45
+ width_mult_0.25x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_0.25x_RGB_16_best.pth
46
+ width_mult_1.0x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_1.0x_RGB_16_best.pth
47
+ width_mult_1.5x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_1.5x_RGB_16_best.pth
48
+ width_mult_2.0x : weights/backbone3D/shufflenetv2/kinetics_shufflenetv2_2.0x_RGB_16_best.pth
49
+
50
+ I3D:
51
+ PRETRAIN:
52
+ default: weights/backbone3D/I3D/rgb_imagenet.pth
53
+
54
+ RESNET:
55
+ ver : 101
56
+
57
+ PRETRAIN:
58
+ ver_18 : weights/backbone3D/resnet/kinetics_resnet_18_RGB_16_best.pth
59
+ ver_50 : weights/backbone3D/resnet/kinetics_resnet_50_RGB_16_best.pth
60
+ ver_101: weights/backbone3D/resnet/kinetics_resnet_101_RGB_16_best.pth
61
+
62
+ RESNEXT:
63
+ ver : 101
64
+
65
+ PRETRAIN:
66
+ ver_101 : weights/backbone3D/resnext/resnext-101-kinetics.pth
67
+
68
+ LOSS:
69
+ TAL:
70
+ top_k : 10
71
+ alpha : 0.5
72
+ beta : 6.0
73
+ radius : 2.5
74
+ soft_label : False
75
+
76
+ scale_cls_loss : 0.5
77
+ scale_box_loss : 7.5
78
+ scale_dfl_loss : 1.5
79
+
80
+ SIMOTA:
81
+ top_k : 10
82
+ gamma : 0.5
83
+ radius : 2.5
84
+ mode : unbalance
85
+ soft_label : True
86
+
87
+ dynamic_k : False
88
+ dynamic_top_k : 10
89
+
90
+ scale_cls_loss : 0.5
91
+ scale_box_loss : 5.0
92
+ scale_dfl_loss : 0.5
93
+
94
+ NORMAL:
95
+ top_k : 10
96
+ radius : 2.5
97
+
98
+ dynamic_k : True
99
+ dynamic_top_k : 10
100
+
101
+ scale_cls_loss : 1.0
102
+ scale_box_loss : 5.0
103
+ scale_dfl_loss : 1.0
104
+
105
+ config_path : config/cf/ava.yaml
106
+ dataset : ava
107
+ loss : simota
108
+ active_checker : True
109
+ num_classes : 80
110
+ backbone2D : yolov8
111
+ backbone3D : i3d
112
+ fusion_module : LKA
113
+ mode : decoupled
114
+ interchannels : [256, 256, 256]
115
+ pretrain_path : weights/fig1/ava/LKA/ema_epoch_9.pth
116
+ data_root : /home/manh/Datasets/ava
117
+ img_size : 224
118
+ clip_length : 16
119
+ batch_size : 8
120
+ num_workers : 6
121
+ acc_grad : 16
122
+ lr : 0.0001
123
+ weight_decay : 0.0005
124
+ max_step_warmup : 500
125
+ adjustlr_schedule : [3, 4, 5, 6]
126
+ max_epoch : 9
127
+ lr_decay : 0.5
128
+ save_folder : weights/fig1/ava/LKA
129
+ sampling_rate : 1
130
+ labelmap : evaluator/Evaluation/ava_action_list_v2.2_for_activitynet_2019.pbtxt
131
+ groundtruth : evaluator/Evaluation/ava_val_v2.2.csv
132
+ detections : ava_result/ava_predicted_file.csv
133
+
134
+
135
+ idx2name:
136
+ 0 : bend/bow (at the waist)
137
+ 1 : crawl
138
+ 2 : crouch/kneel
139
+ 3 : dance
140
+ 4 : fall down
141
+ 5 : get up
142
+ 6 : jump/leap
143
+ 7 : lie/sleep
144
+ 8 : martial art
145
+ 9 : run/jog
146
+ 10 : sit
147
+ 11 : stand
148
+ 12 : swim
149
+ 13 : walk
150
+ 14 : answer phone
151
+ 15 : brush teeth
152
+ 16 : carry/hold (an object)
153
+ 17 : catch (an object)
154
+ 18 : chop
155
+ 19 : climb (e.g., a mountain)
156
+ 20 : clink glass
157
+ 21 : close (e.g., a door, a box)
158
+ 22 : cook
159
+ 23 : cut
160
+ 24 : dig
161
+ 25 : dress/put on clothing
162
+ 26 : drink
163
+ 27 : drive (e.g., a car, a truck)
164
+ 28 : eat
165
+ 29 : enter
166
+ 30 : exit
167
+ 31 : extract
168
+ 32 : fishing
169
+ 33 : hit (an object)
170
+ 34 : kick (an object)
171
+ 35 : lift/pick up
172
+ 36 : listen (e.g., to music)
173
+ 37 : open (e.g., a window, a car door)
174
+ 38 : paint
175
+ 39 : play board game
176
+ 40 : play musical instrument
177
+ 41 : play with pets
178
+ 42 : point to (an object)
179
+ 43 : press
180
+ 44 : pull (an object)
181
+ 45 : push (an object)
182
+ 46 : put down
183
+ 47 : read
184
+ 48 : ride (e.g., a bike, a car, a horse)
185
+ 49 : row boat
186
+ 50 : sail boat
187
+ 51 : shoot
188
+ 52 : shovel
189
+ 53 : smoke
190
+ 54 : stir
191
+ 55 : take a photo
192
+ 56 : text on/look at a cellphone
193
+ 57 : throw
194
+ 58 : touch (an object)
195
+ 59 : turn (e.g., a screwdriver)
196
+ 60 : watch (e.g., TV)
197
+ 61 : work on a computer
198
+ 62 : write
199
+ 63 : fight/hit (a person)
200
+ 64 : give/serve (an object) to (a person)
201
+ 65 : grab (a person)
202
+ 66 : hand clap
203
+ 67 : hand shake
204
+ 68 : hand wave
205
+ 69 : hug (a person)
206
+ 70 : kick (a person)
207
+ 71 : kiss (a person)
208
+ 72 : lift (a person)
209
+ 73 : listen to (a person)
210
+ 74 : play with kids
211
+ 75 : push (another person)
212
+ 76 : sing to (e.g., self, a person, a group)
213
+ 77 : take (an object) from (a person)
214
+ 78 : talk to (e.g., self, a person, a group)
215
+ 79 : watch (a person)
216
+
217
+
218
+ train_class_count:
219
+ 0 : 8322
220
+ 1 : 157
221
+ 2 : 2309
222
+ 3 : 3239
223
+ 4 : 291
224
+ 5 : 1120
225
+ 6 : 245
226
+ 7 : 5349
227
+ 8 : 2102
228
+ 9 : 3308
229
+ 10 : 99884
230
+ 11 : 165387
231
+ 12 : 110
232
+ 13 : 40341
233
+ 14 : 3275
234
+ 15 : 20
235
+ 16 : 80025
236
+ 17 : 80
237
+ 18 : 36
238
+ 19 : 267
239
+ 20 : 53
240
+ 21 : 784
241
+ 22 : 65
242
+ 23 : 184
243
+ 24 : 41
244
+ 25 : 342
245
+ 26 : 2319
246
+ 27 : 1187
247
+ 28 : 3012
248
+ 29 : 221
249
+ 30 : 53
250
+ 31 : 7
251
+ 32 : 79
252
+ 33 : 177
253
+ 34 : 35
254
+ 35 : 518
255
+ 36 : 660
256
+ 37 : 1247
257
+ 38 : 67
258
+ 39 : 117
259
+ 40 : 1290
260
+ 41 : 138
261
+ 42 : 97
262
+ 43 : 94
263
+ 44 : 341
264
+ 45 : 385
265
+ 46 : 533
266
+ 47 : 2141
267
+ 48 : 4784
268
+ 49 : 62
269
+ 50 : 712
270
+ 51 : 219
271
+ 52 : 67
272
+ 53 : 2986
273
+ 54 : 59
274
+ 55 : 180
275
+ 56 : 415
276
+ 57 : 248
277
+ 58 : 17077
278
+ 59 : 135
279
+ 60 : 1983
280
+ 61 : 176
281
+ 62 : 773
282
+ 63 : 2691
283
+ 64 : 1073
284
+ 65 : 1993
285
+ 66 : 1175
286
+ 67 : 619
287
+ 68 : 343
288
+ 69 : 1101
289
+ 70 : 50
290
+ 71 : 714
291
+ 72 : 400
292
+ 73 : 106175
293
+ 74 : 127
294
+ 75 : 355
295
+ 76 : 1638
296
+ 77 : 608
297
+ 78 : 110151
298
+ 79 : 167115
299
+
300
+
301
+ class_ratio:
302
+ 79: 0.5059319458527529
303
+ 11: 0.5005430972490094
304
+ 78: 0.3317767554377424
305
+ 73: 0.32139321745252786
306
+ 10: 0.3018567607333167
307
+ 16: 0.24206491290886498
308
+ 13: 0.12267378359756043
309
+ 58: 0.05155061034502472
310
+ 0: 0.02512088050957867
311
+ 7: 0.016115395377806128
312
+ 48: 0.014466546112115732
313
+ 9: 0.010040529196366514
314
+ 14: 0.00986601595291753
315
+ 3: 0.00982990976461774
316
+ 28: 0.009101768300571982
317
+ 53: 0.008999467433722578
318
+ 63: 0.008108848122327766
319
+ 26: 0.007025662473334075
320
+ 2: 0.006983538586984321
321
+ 47: 0.006456990007612388
322
+ 8: 0.006369733385887896
323
+ 65: 0.006026724597039895
324
+ 60: 0.0059966361067900695
325
+ 76: 0.004943538948046204
326
+ 40: 0.003902477185402268
327
+ 37: 0.0037640701302530744
328
+ 27: 0.0035745126416791783
329
+ 66: 0.003571503792654196
330
+ 5: 0.0033819463040803003
331
+ 69: 0.0033187604745556682
332
+ 64: 0.003228495003806194
333
+ 21: 0.0023649553336362243
334
+ 62: 0.002337875692411382
335
+ 50: 0.0021633624489623983
336
+ 71: 0.002148318203837486
337
+ 36: 0.0020099111486882922
338
+ 67: 0.001862477546464151
339
+ 77: 0.0018293802071893438
340
+ 46: 0.0016037165303156584
341
+ 35: 0.0015615926439659037
342
+ 56: 0.0012486723453677265
343
+ 72: 0.0012035396099929893
344
+ 45: 0.0011644245726682172
345
+ 75: 0.0010681414038687781
346
+ 68: 0.001056106007768848
347
+ 44: 0.001035044064593971
348
+ 25: 0.001029026366544006
349
+ 4: 0.0008755750662698998
350
+ 19: 0.0008063715386953028
351
+ 57: 0.0007492034072206358
352
+ 6: 0.000737168011120706
353
+ 29: 0.0006769910306210565
354
+ 51: 0.0006679644835461091
355
+ 23: 0.0005536282205967751
356
+ 55: 0.0005446016735218277
357
+ 33: 0.0005325662774218978
358
+ 61: 0.0005295574283969153
359
+ 1: 0.0004723892969222483
360
+ 41: 0.0004152211654475813
361
+ 59: 0.00041221231642259886
362
+ 74: 0.00038212382617277413
363
+ 39: 0.00035504418494793186
364
+ 12: 0.00033398224177305457
365
+ 42: 0.00029185835542329993
366
+ 43: 0.0002828318083483525
367
+ 17: 0.00024070792199859788
368
+ 32: 0.0002376990729736154
369
+ 38: 0.0002015928846738257
370
+ 52: 0.0002015928846738257
371
+ 22: 0.00019557518662386078
372
+ 49: 0.00018654863954891334
373
+ 54: 0.00018053094149894842
374
+ 20: 0.0001594689983240711
375
+ 30: 0.0001594689983240711
376
+ 70: 0.00015044245124912366
377
+ 24: 0.00012336281002428142
378
+ 18: 0.00010831856489936904
379
+ 34: 0.00010530971587438658
380
+ 15: 6.017698049964947e-05
381
+ 31: 2.1061943174877314e-05
ava/LKA/ema_epoch_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c404dc7f0bb1e3146f3eae8a20b04252166cea4934c361bc955f9c085c2622eb
3
+ size 212382830
ava/LKA/ema_epoch_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94d982251ef0b2087863d2a434c61717eb2eeaf13ac4ab960fe531d9b99ead3d
3
+ size 212382830
ava/LKA/ema_epoch_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f585aaae1b746447db72e95803752c2b492536c81da920f855786fe8fca1e3b9
3
+ size 212382830
ava/LKA/ema_epoch_4.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28ef552393a0a23d42995de0d2ed7b962b0cd543e77538a7f8b387edd335e3d0
3
+ size 212382830
ava/LKA/ema_epoch_5.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642fb6a14d9898e2a0e5b42e7ec3f7612c2a940214df5e8658e0e12550bbda04
3
+ size 212382830
ava/LKA/ema_epoch_6.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b85d0769466b884f3da69dd5107a6f979e9b1d7a1becd4f1bbcba44d191ffe22
3
+ size 212382830
ava/LKA/ema_epoch_7.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a242014f5ae6c5b958a562a7780efa7761f3eb13d084254718304c4085719c3d
3
+ size 212382830
ava/LKA/ema_epoch_8.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee9c20112c9b6b0115b59b91fea5acc721da84e1664e53116f0487e0fe01b715
3
+ size 212382830
ava/LKA/ema_epoch_9.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:879e7704aff12fff9ce961047d8479ee8da299857a26dac3059b64ffe87b686c
3
+ size 212382830