{
  "architectures": [
    "OpticalFlowPerceiver"
  ],
  "model_config": {
    "activation_checkpointing": false,
    "activation_offloading": false,
    "decoder": {
      "cross_attention_residual": false,
      "cross_attention_widening_factor": 1,
      "dropout": 0.1,
      "freeze": false,
      "image_shape": [
        368,
        496
      ],
      "init_scale": 0.02,
      "num_cross_attention_heads": 1,
      "num_cross_attention_qk_channels": 512,
      "num_cross_attention_v_channels": 512,
      "rescale_factor": 100.0
    },
    "encoder": {
      "cross_attention_widening_factor": 1,
      "dropout": 0.1,
      "first_cross_attention_layer_shared": false,
      "first_self_attention_block_shared": true,
      "freeze": false,
      "image_shape": [
        368,
        496
      ],
      "init_scale": 0.02,
      "num_cross_attention_heads": 1,
      "num_cross_attention_layers": 1,
      "num_cross_attention_qk_channels": null,
      "num_cross_attention_v_channels": null,
      "num_frequency_bands": 64,
      "num_patch_hidden_channels": 64,
      "num_patch_input_channels": 27,
      "num_self_attention_blocks": 1,
      "num_self_attention_heads": 16,
      "num_self_attention_layers_per_block": 24,
      "num_self_attention_qk_channels": null,
      "num_self_attention_v_channels": null,
      "self_attention_widening_factor": 1
    },
    "num_latent_channels": 512,
    "num_latents": 2048
  },
  "model_type": "perceiver-io-optical-flow",
  "torch_dtype": "float32",
  "transformers_version": "4.28.0"
}
|