| Parameters: |
| ================================================================================================================================ |
| Name Shape Type Grad |
| input_layer.weight torch.Size([32, 1, 3, 3, 3]) torch.float32 True |
| input_layer.bias torch.Size([32]) torch.float32 True |
| blocks.0.norm1.weight torch.Size([32]) torch.float32 True |
| blocks.0.norm1.bias torch.Size([32]) torch.float32 True |
| blocks.0.norm2.weight torch.Size([32]) torch.float32 True |
| blocks.0.norm2.bias torch.Size([32]) torch.float32 True |
| blocks.0.conv1.weight torch.Size([32, 32, 3, 3, 3]) torch.float16 True |
| blocks.0.conv1.bias torch.Size([32]) torch.float16 True |
| blocks.0.conv2.weight torch.Size([32, 32, 3, 3, 3]) torch.float16 True |
| blocks.0.conv2.bias torch.Size([32]) torch.float16 True |
| blocks.1.norm1.weight torch.Size([32]) torch.float32 True |
| blocks.1.norm1.bias torch.Size([32]) torch.float32 True |
| blocks.1.norm2.weight torch.Size([32]) torch.float32 True |
| blocks.1.norm2.bias torch.Size([32]) torch.float32 True |
| blocks.1.conv1.weight torch.Size([32, 32, 3, 3, 3]) torch.float16 True |
| blocks.1.conv1.bias torch.Size([32]) torch.float16 True |
| blocks.1.conv2.weight torch.Size([32, 32, 3, 3, 3]) torch.float16 True |
| blocks.1.conv2.bias torch.Size([32]) torch.float16 True |
| blocks.2.conv.weight torch.Size([128, 32, 2, 2, 2]) torch.float16 True |
| blocks.2.conv.bias torch.Size([128]) torch.float16 True |
| blocks.3.norm1.weight torch.Size([128]) torch.float32 True |
| blocks.3.norm1.bias torch.Size([128]) torch.float32 True |
| blocks.3.norm2.weight torch.Size([128]) torch.float32 True |
| blocks.3.norm2.bias torch.Size([128]) torch.float32 True |
| blocks.3.conv1.weight torch.Size([128, 128, 3, 3, 3]) torch.float16 True |
| blocks.3.conv1.bias torch.Size([128]) torch.float16 True |
| blocks.3.conv2.weight torch.Size([128, 128, 3, 3, 3]) torch.float16 True |
| blocks.3.conv2.bias torch.Size([128]) torch.float16 True |
| blocks.4.norm1.weight torch.Size([128]) torch.float32 True |
| blocks.4.norm1.bias torch.Size([128]) torch.float32 True |
| blocks.4.norm2.weight torch.Size([128]) torch.float32 True |
| blocks.4.norm2.bias torch.Size([128]) torch.float32 True |
| blocks.4.conv1.weight torch.Size([128, 128, 3, 3, 3]) torch.float16 True |
| blocks.4.conv1.bias torch.Size([128]) torch.float16 True |
| blocks.4.conv2.weight torch.Size([128, 128, 3, 3, 3]) torch.float16 True |
| blocks.4.conv2.bias torch.Size([128]) torch.float16 True |
| blocks.5.conv.weight torch.Size([512, 128, 2, 2, 2]) torch.float16 True |
| blocks.5.conv.bias torch.Size([512]) torch.float16 True |
| blocks.6.norm1.weight torch.Size([512]) torch.float32 True |
| blocks.6.norm1.bias torch.Size([512]) torch.float32 True |
| blocks.6.norm2.weight torch.Size([512]) torch.float32 True |
| blocks.6.norm2.bias torch.Size([512]) torch.float32 True |
| blocks.6.conv1.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| blocks.6.conv1.bias torch.Size([512]) torch.float16 True |
| blocks.6.conv2.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| blocks.6.conv2.bias torch.Size([512]) torch.float16 True |
| blocks.7.norm1.weight torch.Size([512]) torch.float32 True |
| blocks.7.norm1.bias torch.Size([512]) torch.float32 True |
| blocks.7.norm2.weight torch.Size([512]) torch.float32 True |
| blocks.7.norm2.bias torch.Size([512]) torch.float32 True |
| blocks.7.conv1.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| blocks.7.conv1.bias torch.Size([512]) torch.float16 True |
| blocks.7.conv2.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| blocks.7.conv2.bias torch.Size([512]) torch.float16 True |
| middle_block.0.norm1.weight torch.Size([512]) torch.float32 True |
| middle_block.0.norm1.bias torch.Size([512]) torch.float32 True |
| middle_block.0.norm2.weight torch.Size([512]) torch.float32 True |
| middle_block.0.norm2.bias torch.Size([512]) torch.float32 True |
| middle_block.0.conv1.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| middle_block.0.conv1.bias torch.Size([512]) torch.float16 True |
| middle_block.0.conv2.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| middle_block.0.conv2.bias torch.Size([512]) torch.float16 True |
| middle_block.1.norm1.weight torch.Size([512]) torch.float32 True |
| middle_block.1.norm1.bias torch.Size([512]) torch.float32 True |
| middle_block.1.norm2.weight torch.Size([512]) torch.float32 True |
| middle_block.1.norm2.bias torch.Size([512]) torch.float32 True |
| middle_block.1.conv1.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| middle_block.1.conv1.bias torch.Size([512]) torch.float16 True |
| middle_block.1.conv2.weight torch.Size([512, 512, 3, 3, 3]) torch.float16 True |
| middle_block.1.conv2.bias torch.Size([512]) torch.float16 True |
| out_layer.0.weight torch.Size([512]) torch.float32 True |
| out_layer.0.bias torch.Size([512]) torch.float32 True |
| out_layer.2.weight torch.Size([16, 512, 3, 3, 3]) torch.float32 True |
| out_layer.2.bias torch.Size([16]) torch.float32 True |
|
|
| Number of parameters: 59298192 |
| Number of trainable parameters: 59298192 |
|
|
|
|