{
  "converter_version": 1,
  "model_id": "robbyant/lingbot-depth-pretrain-vitl-14-v0.5",
  "num_tokens_range": [
    1200,
    3600
  ],
  "patch_size": 14,
  "num_heads": 16,
  "embed_dim": 1024,
  "depth": 24,
  "remap_depth_in": "log",
  "remap_depth_out": "linear",
  "image_mean": [
    0.48500001430511475,
    0.4560000002384186,
    0.4059999883174896
  ],
  "image_std": [
    0.2290000021457672,
    0.2240000069141388,
    0.22499999403953552
  ],
  "neck": 1024
}