justin-onda committed on
Commit
898e848
·
1 Parent(s): 575aa0e

encoder를 dino v2 공식 모델로 변경

Browse files
Files changed (3) hide show
  1. encoder.onnx +2 -2
  2. model_info.json +0 -112
  3. preprocessor_config.json +27 -0
encoder.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab6d6bebf6eb8a3aa75071ff89c6f4e4f2877d325ac192428fe16254ffcf2396
3
- size 1213332927
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fabcbe2e231b7b2035588329ec6df427c08baa8723eb31546c52738888013ca
3
+ size 1218043280
model_info.json DELETED
@@ -1,112 +0,0 @@
1
- {
2
- "model_architecture": {
3
- "backbone": "vit_large_patch14_dinov2.lvd142m",
4
- "feature_dim": 1024,
5
- "total_parameters": 303252502,
6
- "trainable_parameters": 24598,
7
- "freeze_backbone": true
8
- },
9
- "input_specification": {
10
- "image_size": [
11
- 224,
12
- 224
13
- ],
14
- "channels": 3,
15
- "pixel_range": [
16
- 0.0,
17
- 1.0
18
- ],
19
- "normalization": {
20
- "mean": [
21
- 0.485,
22
- 0.456,
23
- 0.406
24
- ],
25
- "std": [
26
- 0.229,
27
- 0.224,
28
- 0.225
29
- ],
30
- "description": "ImageNet normalization for DINOv2"
31
- },
32
- "input_format": "RGB",
33
- "tensor_layout": "NCHW"
34
- },
35
- "output_specification": {
36
- "heads": {
37
- "scene": {
38
- "num_classes": 6,
39
- "output_type": "logits",
40
- "activation": "softmax",
41
- "classes": [
42
- 16000001,
43
- 16000002,
44
- 16000006,
45
- 16000008,
46
- 16000009,
47
- 16000011
48
- ]
49
- },
50
- "concept": {
51
- "num_classes": 3,
52
- "output_type": "logits",
53
- "activation": "softmax",
54
- "classes": [
55
- 17000001,
56
- 17000002,
57
- 17000003
58
- ]
59
- },
60
- "object": {
61
- "num_classes": 13,
62
- "output_type": "logits",
63
- "activation": "softmax",
64
- "classes": [
65
- 18000001,
66
- 18000002,
67
- 18000004,
68
- 18000005,
69
- 18000006,
70
- 18000007,
71
- 18000008,
72
- 18000009,
73
- 18000010,
74
- 18000012,
75
- 18000014,
76
- 18000016,
77
- "unclassified"
78
- ]
79
- }
80
- }
81
- },
82
- "class_mappings": {
83
- "scene": {
84
- "0": 16000001,
85
- "1": 16000002,
86
- "2": 16000006,
87
- "3": 16000008,
88
- "4": 16000009,
89
- "5": 16000011
90
- },
91
- "concept": {
92
- "0": 17000001,
93
- "1": 17000002,
94
- "2": 17000003
95
- },
96
- "object": {
97
- "0": 18000001,
98
- "1": 18000002,
99
- "2": 18000004,
100
- "3": 18000005,
101
- "4": 18000006,
102
- "5": 18000007,
103
- "6": 18000008,
104
- "7": 18000009,
105
- "8": 18000010,
106
- "9": 18000012,
107
- "10": 18000014,
108
- "11": 18000016,
109
- "12": "unclassified"
110
- }
111
- }
112
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
preprocessor_config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.485,
13
+ 0.456,
14
+ 0.406
15
+ ],
16
+ "image_processor_type": "BitImageProcessor",
17
+ "image_std": [
18
+ 0.229,
19
+ 0.224,
20
+ 0.225
21
+ ],
22
+ "resample": 3,
23
+ "rescale_factor": 0.00392156862745098,
24
+ "size": {
25
+ "shortest_edge": 256
26
+ }
27
+ }