Scone / ae_metadata.json
Ryann829's picture
Upload folder using huggingface_hub
b8e4e54 verified
{
"decoder.conv_in.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.conv_in.weight": {
"shape": [
512,
16,
3,
3
],
"dtype": "torch.float32"
},
"decoder.conv_out.bias": {
"shape": [
3
],
"dtype": "torch.float32"
},
"decoder.conv_out.weight": {
"shape": [
3,
128,
3,
3
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.k.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.k.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.norm.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.norm.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.proj_out.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.proj_out.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.q.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.q.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.v.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.attn_1.v.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_1.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.mid.block_2.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.norm_out.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.norm_out.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.conv1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.conv1.weight": {
"shape": [
128,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.conv2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.conv2.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.nin_shortcut.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.nin_shortcut.weight": {
"shape": [
128,
256,
1,
1
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.norm1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.norm1.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.norm2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.0.norm2.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.conv1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.conv1.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.conv2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.conv2.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.norm1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.norm1.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.norm2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.1.norm2.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.conv1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.conv1.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.conv2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.conv2.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.norm1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.norm1.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.norm2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.0.block.2.norm2.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.conv1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.conv1.weight": {
"shape": [
256,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.conv2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.conv2.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.nin_shortcut.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.nin_shortcut.weight": {
"shape": [
256,
512,
1,
1
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.norm2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.0.norm2.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.conv1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.conv1.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.conv2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.conv2.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.norm1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.norm1.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.norm2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.1.norm2.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.conv1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.conv1.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.conv2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.conv2.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.norm1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.norm1.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.norm2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.block.2.norm2.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.upsample.conv.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"decoder.up.1.upsample.conv.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.0.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.1.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.block.2.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.upsample.conv.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.2.upsample.conv.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.0.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.1.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.block.2.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.upsample.conv.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"decoder.up.3.upsample.conv.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.conv_in.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.conv_in.weight": {
"shape": [
128,
3,
3,
3
],
"dtype": "torch.float32"
},
"encoder.conv_out.bias": {
"shape": [
32
],
"dtype": "torch.float32"
},
"encoder.conv_out.weight": {
"shape": [
32,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.conv1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.conv1.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.conv2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.conv2.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.norm1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.norm1.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.norm2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.0.norm2.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.conv1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.conv1.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.conv2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.conv2.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.norm1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.norm1.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.norm2.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.block.1.norm2.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.downsample.conv.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.0.downsample.conv.weight": {
"shape": [
128,
128,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.conv1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.conv1.weight": {
"shape": [
256,
128,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.conv2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.conv2.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.nin_shortcut.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.nin_shortcut.weight": {
"shape": [
256,
128,
1,
1
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.norm1.bias": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.norm1.weight": {
"shape": [
128
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.norm2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.0.norm2.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.conv1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.conv1.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.conv2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.conv2.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.norm1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.norm1.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.norm2.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.block.1.norm2.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.downsample.conv.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.1.downsample.conv.weight": {
"shape": [
256,
256,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.conv1.weight": {
"shape": [
512,
256,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.nin_shortcut.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.nin_shortcut.weight": {
"shape": [
512,
256,
1,
1
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.norm1.bias": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.norm1.weight": {
"shape": [
256
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.0.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.block.1.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.downsample.conv.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.2.downsample.conv.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.0.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.down.3.block.1.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.k.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.k.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.norm.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.norm.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.proj_out.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.proj_out.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.q.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.q.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.v.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.attn_1.v.weight": {
"shape": [
512,
512,
1,
1
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_1.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.conv1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.conv1.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.conv2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.conv2.weight": {
"shape": [
512,
512,
3,
3
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.norm1.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.norm1.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.norm2.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.mid.block_2.norm2.weight": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.norm_out.bias": {
"shape": [
512
],
"dtype": "torch.float32"
},
"encoder.norm_out.weight": {
"shape": [
512
],
"dtype": "torch.float32"
}
}