File size: 6,774 Bytes
7b932f9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
{
    "module": "keras_hub.src.models.sam3.sam3_pc_backbone",
    "class_name": "SAM3PromptableConceptBackbone",
    "config": {
        "name": "sam3_promptable_concept_backbone",
        "trainable": true,
        "dtype": {
            "module": "keras",
            "class_name": "DTypePolicy",
            "config": {
                "name": "float32"
            },
            "registered_name": null
        },
        "vision_encoder": {
            "module": "keras_hub.src.models.sam3.sam3_vision_encoder",
            "class_name": "SAM3VisionEncoder",
            "config": {
                "name": "sam3_vision_encoder",
                "trainable": true,
                "dtype": {
                    "module": "keras",
                    "class_name": "DTypePolicy",
                    "config": {
                        "name": "float32"
                    },
                    "registered_name": null
                },
                "image_shape": [
                    1008,
                    1008,
                    3
                ],
                "patch_size": 14,
                "num_layers": 32,
                "hidden_dim": 1024,
                "intermediate_dim": 4736,
                "num_heads": 16,
                "fpn_hidden_dim": 256,
                "fpn_scale_factors": [
                    4.0,
                    2.0,
                    1.0,
                    0.5
                ],
                "pretrain_image_shape": [
                    336,
                    336,
                    3
                ],
                "hidden_activation": "gelu",
                "rope_theta": 10000.0,
                "window_size": 24,
                "global_attn_indexes": [
                    7,
                    15,
                    23,
                    31
                ],
                "attention_dropout_rate": 0.0,
                "hidden_dropout_rate": 0.0,
                "layer_norm_epsilon": 1e-06
            },
            "registered_name": "keras_hub>SAM3VisionEncoder"
        },
        "text_encoder": {
            "module": "keras_hub.src.models.sam3.sam3_text_encoder",
            "class_name": "SAM3TextEncoder",
            "config": {
                "name": "sam3_text_encoder",
                "trainable": true,
                "dtype": {
                    "module": "keras",
                    "class_name": "DTypePolicy",
                    "config": {
                        "name": "float32"
                    },
                    "registered_name": null
                },
                "vocabulary_size": 49408,
                "embedding_dim": 1024,
                "hidden_dim": 1024,
                "num_layers": 24,
                "num_heads": 16,
                "intermediate_dim": 4096,
                "intermediate_activation": "gelu",
                "max_sequence_length": 32,
                "layer_norm_epsilon": 1e-05
            },
            "registered_name": "keras_hub>SAM3TextEncoder"
        },
        "geometry_encoder": {
            "module": "keras_hub.src.models.sam3.sam3_geometry_encoder",
            "class_name": "SAM3GeometryEncoder",
            "config": {
                "name": "sam3_geometry_encoder",
                "trainable": true,
                "dtype": {
                    "module": "keras",
                    "class_name": "DTypePolicy",
                    "config": {
                        "name": "float32"
                    },
                    "registered_name": null
                },
                "num_layers": 3,
                "hidden_dim": 256,
                "intermediate_dim": 2048,
                "num_heads": 8,
                "roi_size": 7,
                "hidden_activation": "relu",
                "dropout_rate": 0.0,
                "layer_norm_epsilon": 1e-06
            },
            "registered_name": "keras_hub>SAM3GeometryEncoder"
        },
        "detr_encoder": {
            "module": "keras_hub.src.models.sam3.sam3_detr_encoder",
            "class_name": "SAM3DetrEncoder",
            "config": {
                "name": "sam3_detr_encoder",
                "trainable": true,
                "dtype": {
                    "module": "keras",
                    "class_name": "DTypePolicy",
                    "config": {
                        "name": "float32"
                    },
                    "registered_name": null
                },
                "num_layers": 6,
                "hidden_dim": 256,
                "intermediate_dim": 2048,
                "num_heads": 8,
                "hidden_activation": "relu",
                "dropout_rate": 0.1,
                "layer_norm_epsilon": 1e-06
            },
            "registered_name": "keras_hub>SAM3DetrEncoder"
        },
        "detr_decoder": {
            "module": "keras_hub.src.models.sam3.sam3_detr_decoder",
            "class_name": "SAM3DetrDecoder",
            "config": {
                "name": "sam3_detr_decoder",
                "trainable": true,
                "dtype": {
                    "module": "keras",
                    "class_name": "DTypePolicy",
                    "config": {
                        "name": "float32"
                    },
                    "registered_name": null
                },
                "image_shape": [
                    1008,
                    1008,
                    3
                ],
                "patch_size": 14,
                "num_layers": 6,
                "hidden_dim": 256,
                "intermediate_dim": 2048,
                "num_heads": 8,
                "num_queries": 200,
                "hidden_activation": "relu",
                "dropout_rate": 0.1,
                "layer_norm_epsilon": 1e-06
            },
            "registered_name": "keras_hub>SAM3DetrDecoder"
        },
        "mask_decoder": {
            "module": "keras_hub.src.models.sam3.sam3_mask_decoder",
            "class_name": "SAM3MaskDecoder",
            "config": {
                "name": "sam3_mask_decoder",
                "trainable": true,
                "dtype": {
                    "module": "keras",
                    "class_name": "DTypePolicy",
                    "config": {
                        "name": "float32"
                    },
                    "registered_name": null
                },
                "num_upsampling_stages": 3,
                "hidden_dim": 256,
                "num_heads": 8,
                "dropout_rate": 0.0,
                "layer_norm_epsilon": 1e-06
            },
            "registered_name": "keras_hub>SAM3MaskDecoder"
        }
    },
    "registered_name": "keras_hub>SAM3PromptableConceptBackbone"
}