Commit
·
898e848
1
Parent(s):
575aa0e
encoder를 dino v2 공식 모델로 변경
Browse files- encoder.onnx +2 -2
- model_info.json +0 -112
- preprocessor_config.json +27 -0
encoder.onnx
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2fabcbe2e231b7b2035588329ec6df427c08baa8723eb31546c52738888013ca
|
| 3 |
+
size 1218043280
|
model_info.json
DELETED
|
@@ -1,112 +0,0 @@
|
|
| 1 |
-
{
|
| 2 |
-
"model_architecture": {
|
| 3 |
-
"backbone": "vit_large_patch14_dinov2.lvd142m",
|
| 4 |
-
"feature_dim": 1024,
|
| 5 |
-
"total_parameters": 303252502,
|
| 6 |
-
"trainable_parameters": 24598,
|
| 7 |
-
"freeze_backbone": true
|
| 8 |
-
},
|
| 9 |
-
"input_specification": {
|
| 10 |
-
"image_size": [
|
| 11 |
-
224,
|
| 12 |
-
224
|
| 13 |
-
],
|
| 14 |
-
"channels": 3,
|
| 15 |
-
"pixel_range": [
|
| 16 |
-
0.0,
|
| 17 |
-
1.0
|
| 18 |
-
],
|
| 19 |
-
"normalization": {
|
| 20 |
-
"mean": [
|
| 21 |
-
0.485,
|
| 22 |
-
0.456,
|
| 23 |
-
0.406
|
| 24 |
-
],
|
| 25 |
-
"std": [
|
| 26 |
-
0.229,
|
| 27 |
-
0.224,
|
| 28 |
-
0.225
|
| 29 |
-
],
|
| 30 |
-
"description": "ImageNet normalization for DINOv2"
|
| 31 |
-
},
|
| 32 |
-
"input_format": "RGB",
|
| 33 |
-
"tensor_layout": "NCHW"
|
| 34 |
-
},
|
| 35 |
-
"output_specification": {
|
| 36 |
-
"heads": {
|
| 37 |
-
"scene": {
|
| 38 |
-
"num_classes": 6,
|
| 39 |
-
"output_type": "logits",
|
| 40 |
-
"activation": "softmax",
|
| 41 |
-
"classes": [
|
| 42 |
-
16000001,
|
| 43 |
-
16000002,
|
| 44 |
-
16000006,
|
| 45 |
-
16000008,
|
| 46 |
-
16000009,
|
| 47 |
-
16000011
|
| 48 |
-
]
|
| 49 |
-
},
|
| 50 |
-
"concept": {
|
| 51 |
-
"num_classes": 3,
|
| 52 |
-
"output_type": "logits",
|
| 53 |
-
"activation": "softmax",
|
| 54 |
-
"classes": [
|
| 55 |
-
17000001,
|
| 56 |
-
17000002,
|
| 57 |
-
17000003
|
| 58 |
-
]
|
| 59 |
-
},
|
| 60 |
-
"object": {
|
| 61 |
-
"num_classes": 13,
|
| 62 |
-
"output_type": "logits",
|
| 63 |
-
"activation": "softmax",
|
| 64 |
-
"classes": [
|
| 65 |
-
18000001,
|
| 66 |
-
18000002,
|
| 67 |
-
18000004,
|
| 68 |
-
18000005,
|
| 69 |
-
18000006,
|
| 70 |
-
18000007,
|
| 71 |
-
18000008,
|
| 72 |
-
18000009,
|
| 73 |
-
18000010,
|
| 74 |
-
18000012,
|
| 75 |
-
18000014,
|
| 76 |
-
18000016,
|
| 77 |
-
"unclassified"
|
| 78 |
-
]
|
| 79 |
-
}
|
| 80 |
-
}
|
| 81 |
-
},
|
| 82 |
-
"class_mappings": {
|
| 83 |
-
"scene": {
|
| 84 |
-
"0": 16000001,
|
| 85 |
-
"1": 16000002,
|
| 86 |
-
"2": 16000006,
|
| 87 |
-
"3": 16000008,
|
| 88 |
-
"4": 16000009,
|
| 89 |
-
"5": 16000011
|
| 90 |
-
},
|
| 91 |
-
"concept": {
|
| 92 |
-
"0": 17000001,
|
| 93 |
-
"1": 17000002,
|
| 94 |
-
"2": 17000003
|
| 95 |
-
},
|
| 96 |
-
"object": {
|
| 97 |
-
"0": 18000001,
|
| 98 |
-
"1": 18000002,
|
| 99 |
-
"2": 18000004,
|
| 100 |
-
"3": 18000005,
|
| 101 |
-
"4": 18000006,
|
| 102 |
-
"5": 18000007,
|
| 103 |
-
"6": 18000008,
|
| 104 |
-
"7": 18000009,
|
| 105 |
-
"8": 18000010,
|
| 106 |
-
"9": 18000012,
|
| 107 |
-
"10": 18000014,
|
| 108 |
-
"11": 18000016,
|
| 109 |
-
"12": "unclassified"
|
| 110 |
-
}
|
| 111 |
-
}
|
| 112 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
preprocessor_config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"crop_size": {
|
| 3 |
+
"height": 224,
|
| 4 |
+
"width": 224
|
| 5 |
+
},
|
| 6 |
+
"do_center_crop": true,
|
| 7 |
+
"do_convert_rgb": true,
|
| 8 |
+
"do_normalize": true,
|
| 9 |
+
"do_rescale": true,
|
| 10 |
+
"do_resize": true,
|
| 11 |
+
"image_mean": [
|
| 12 |
+
0.485,
|
| 13 |
+
0.456,
|
| 14 |
+
0.406
|
| 15 |
+
],
|
| 16 |
+
"image_processor_type": "BitImageProcessor",
|
| 17 |
+
"image_std": [
|
| 18 |
+
0.229,
|
| 19 |
+
0.224,
|
| 20 |
+
0.225
|
| 21 |
+
],
|
| 22 |
+
"resample": 3,
|
| 23 |
+
"rescale_factor": 0.00392156862745098,
|
| 24 |
+
"size": {
|
| 25 |
+
"shortest_edge": 256
|
| 26 |
+
}
|
| 27 |
+
}
|