{
  "model_type": "anycalib_ray_head",
  "source_model": "anycalib_gen",
  "description": "AnyCalib ray prediction head (backbone + decoder + head). Calibrator (RANSAC + Gauss-Newton) must run in post-processing.",
  "input": {
    "name": "image",
    "shape": [
      "batch",
      3,
      518,
      518
    ],
    "dtype": "float32",
    "range": [
      0.0,
      1.0
    ],
    "color": "RGB"
  },
  "outputs": [
    {
      "name": "rays",
      "shape": [
        "batch",
        3,
        518,
        518
      ],
      "dtype": "float32"
    },
    {
      "name": "tangent_coords",
      "shape": [
        "batch",
        2,
        518,
        518
      ],
      "dtype": "float32"
    }
  ],
  "architecture": {
    "backbone": "DINOv2 ViT-L/14 (304M params)",
    "decoder": "LightDPT (15.2M params)",
    "head": "ConvexTangentDecoder (0.6M params)",
    "total_params": "~320M"
  },
  "variants": {
    "fp32": "1222.0 MB",
    "fp16": "611.3 MB",
    "int8": "311.1 MB"
  },
  "opset_version": 17,
  "edge_divisible_by": 14,
  "recommended_input_size": 518
}