DavidHiggis
commit
66af79e
-
1.34 kB
commit
decoder.pt
Detected Pickle imports (542)
- "collections.OrderedDict",
- "torch.DoubleStorage",
- "torch.LongStorage",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1139.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_998.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1227.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_966.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1079.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_838.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1206.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_977.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1099.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1120.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_818.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1187.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_830.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_856.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.DalleBartDecoder",
- "__torch__.torch.nn.modules.linear.___torch_mangle_995.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_739.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1125.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1191.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_970.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1156.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_810.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_945.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_917.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_909.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1021.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_881.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_898.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_765.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_984.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1025.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1028.GLU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_844.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1100.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1161.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1222.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1067.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_939.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_791.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1089.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_761.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_843.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1166.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1009.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_867.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_740.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1087.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1114.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1159.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_798.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_822.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_918.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1054.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1070.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1207.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1134.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_826.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_816.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1143.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_938.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1072.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1163.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_896.GLU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_831.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_778.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_805.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_947.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1181.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_952.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_746.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_882.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_780.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1199.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1037.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_729.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1241.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_797.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1239.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_833.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1214.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_806.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1076.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1215.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_959.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1020.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1026.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_885.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_809.DecoderLayer",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1044.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_811.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1066.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1226.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_731.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1105.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1113.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1030.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_727.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1069.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1218.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_859.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1126.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1137.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1252.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1043.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1177.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1005.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_942.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1073.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_872.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1104.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1154.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1046.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_969.DecoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_991.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1018.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1122.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1160.GLU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_793.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_769.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_920.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_871.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_933.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_963.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1217.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1186.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_976.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_983.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1194.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_979.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1127.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_728.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1167.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1039.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1041.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1107.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_764.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_825.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_987.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_910.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_967.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1111.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_953.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_981.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1133.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1023.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1052.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1098.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_923.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_887.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_821.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_894.Linear",
- "__torch__.torch.nn.modules.sparse.___torch_mangle_724.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1151.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1010.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_974.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_852.GLU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_758.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1138.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_873.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1129.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_752.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_772.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_750.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_921.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_985.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_733.Linear",
- "torch.FloatStorage",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_756.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_962.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_808.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_763.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_851.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_870.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_960.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1002.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1110.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1056.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_891.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_824.GELU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_875.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_730.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1077.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_861.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_774.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_847.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_817.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1065.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_828.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1032.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_784.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1213.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1109.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1068.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1091.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1022.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1150.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1011.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_949.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1040.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_737.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_785.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1140.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_745.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_827.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_848.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1204.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1006.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_807.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1016.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1209.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1145.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1229.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_907.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_814.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_839.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_782.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_864.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1182.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1096.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_927.LayerNorm",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1085.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1001.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1173.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1084.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_900.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1034.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_773.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1108.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1119.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1200.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_874.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_940.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1094.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_862.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1220.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1017.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_889.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1082.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_877.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_916.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1136.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_878.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_837.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_813.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1170.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1036.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1027.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_767.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1062.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1179.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_928.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1211.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1243.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1171.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1158.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1175.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1123.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_799.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_993.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1103.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1228.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1118.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1080.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_863.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_869.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_832.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_893.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1189.DecoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1007.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_911.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_915.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1253.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1130.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_904.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1248.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_812.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_735.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1247.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1059.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_884.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_880.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1090.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_926.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1093.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_845.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1015.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1049.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_738.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1202.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1251.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_777.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1149.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1236.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_781.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1174.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_968.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_835.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_753.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_754.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_787.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_760.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_899.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1075.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1176.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1201.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_796.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1212.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1064.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1219.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_905.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_801.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1196.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1232.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1148.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_747.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_989.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1244.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_971.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1000.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1188.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_854.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_941.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_925.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1048.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_913.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1029.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1095.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1038.Linear",
- "__torch__.torch.nn.modules.container.___torch_mangle_1250.ModuleList",
- "__torch__.torch.nn.modules.linear.___torch_mangle_895.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1083.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_986.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_836.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_749.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1165.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1178.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_742.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_736.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_901.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_888.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1106.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1058.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_849.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1142.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_829.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_741.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1012.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1033.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_919.DecoderLayer",
- "__torch__.torch.nn.modules.sparse.___torch_mangle_723.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_776.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_964.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_943.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1245.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1249.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_858.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_759.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1053.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_866.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1164.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1234.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_815.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1153.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_936.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_957.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1031.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_950.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1081.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_795.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_912.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_930.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_994.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_794.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1088.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_868.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_841.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1162.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1168.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1074.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1223.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1146.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_857.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1240.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_755.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_842.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1183.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1128.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1061.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_757.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_732.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_890.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_886.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1112.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1203.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1210.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_876.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_865.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_965.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1135.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1233.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1221.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_922.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1231.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1184.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_779.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1035.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_955.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_929.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_792.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1216.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1045.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1230.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1152.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1197.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1060.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_743.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1124.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_982.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_789.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_766.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1024.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1102.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_823.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1055.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_768.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_961.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1198.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1235.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1003.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1047.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_975.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1092.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_956.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_783.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_775.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1042.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_804.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1169.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_879.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1238.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_853.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1013.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_770.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1116.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_931.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1131.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_744.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_946.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1225.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_897.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1147.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_800.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_903.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1172.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1097.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1019.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_935.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1057.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_855.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_973.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1192.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1004.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1141.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_980.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_999.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_944.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_992.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_850.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_996.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_978.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1237.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_990.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_924.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1063.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_771.DecoderSelfAttention",
- "__torch__.torch.nn.modules.activation.___torch_mangle_934.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_819.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1190.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1246.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_948.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1144.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_972.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_958.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_802.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_748.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_790.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1050.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_726.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_803.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_908.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1115.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1185.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_997.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_937.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1193.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_860.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1205.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_786.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_751.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_840.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_906.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1242.GELU",
- "collections.OrderedDict",
- "__torch__.torch.nn.modules.linear.___torch_mangle_834.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.DecoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_954.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_902.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_951.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1014.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1121.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1155.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_725.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1157.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1195.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_846.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_892.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1101.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_914.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1117.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1224.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_762.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_883.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_788.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1208.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1086.DecoderCrossAttention",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1132.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1180.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_988.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_932.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1071.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_734.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1078.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1008.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1051.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_820.Linear"
How to fix it?
5.48 GB
commit
decoder_fp16.pt
Detected Pickle imports (542)
- "collections.OrderedDict",
- "torch.DoubleStorage",
- "torch.LongStorage",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1139.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_998.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1227.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_966.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1079.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_838.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1206.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_977.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1099.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1120.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_818.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1187.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_830.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_856.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.DalleBartDecoder",
- "__torch__.torch.nn.modules.linear.___torch_mangle_995.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_739.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1125.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1191.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_970.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1156.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_810.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_945.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_917.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_909.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1021.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_881.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_898.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_765.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_984.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1025.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1028.GLU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_844.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1100.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1161.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1222.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1067.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_939.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_791.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1089.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_761.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_843.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1166.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1009.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_867.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_740.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1087.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1114.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1159.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_798.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_822.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_918.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1054.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1070.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1207.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1134.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_826.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_816.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1143.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_938.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1072.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1163.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_896.GLU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_831.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_778.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_805.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_947.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1181.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_952.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_746.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_882.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_780.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1199.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1037.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_729.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1241.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_797.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1239.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_833.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1214.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_806.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1076.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1215.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_959.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1020.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1026.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_885.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_809.DecoderLayer",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1044.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_811.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1066.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1226.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_731.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1105.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1113.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1030.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_727.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1069.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1218.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_859.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1126.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1137.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1252.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1043.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1177.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1005.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_942.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1073.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_872.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1104.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1154.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1046.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_969.DecoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_991.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1018.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1122.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1160.GLU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_793.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_769.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_920.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_871.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_933.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_963.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1217.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1186.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_976.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_983.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1194.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_979.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1127.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_728.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1167.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1039.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1041.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1107.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_764.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_825.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_987.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_910.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_967.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1111.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_953.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_981.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1133.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1023.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1052.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1098.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_923.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_887.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_821.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_894.Linear",
- "__torch__.torch.nn.modules.sparse.___torch_mangle_724.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1151.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1010.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_974.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_852.GLU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_758.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1138.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_873.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1129.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_752.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_772.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_750.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_921.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_985.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_733.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_756.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_962.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_808.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_763.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_851.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_870.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_960.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1002.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1110.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1056.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_891.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_824.GELU",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_875.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_730.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1077.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_861.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_774.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_847.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_817.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1065.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_828.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1032.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_784.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1213.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1109.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1068.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1091.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1022.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1150.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1011.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_949.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1040.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_737.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_785.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1140.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_745.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_827.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_848.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1204.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1006.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_807.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1016.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1209.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1145.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1229.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_907.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_814.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_839.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_782.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_864.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1182.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1096.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_927.LayerNorm",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1085.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1001.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1173.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1084.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_900.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1034.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_773.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1108.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1119.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1200.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_874.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_940.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1094.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_862.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1220.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1017.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_889.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1082.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_877.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_916.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1136.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_878.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_837.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_813.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1170.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1036.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1027.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_767.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1062.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1179.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_928.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1211.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1243.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1171.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1158.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1175.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1123.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_799.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_993.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1103.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1228.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1118.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1080.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_863.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_869.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_832.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_893.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1189.DecoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1007.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_911.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_915.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1253.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1130.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_904.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1248.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_812.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_735.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1247.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1059.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_884.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_880.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1090.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_926.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1093.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_845.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1015.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1049.Linear",
- "torch.HalfStorage",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_738.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1202.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1251.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_777.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1149.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1236.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_781.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1174.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_968.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_835.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_753.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_754.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_787.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_760.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_899.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1075.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1176.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1201.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_796.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1212.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1064.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1219.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_905.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_801.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1196.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1232.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1148.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_747.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_989.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1244.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_971.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1000.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1188.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_854.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_941.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_925.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1048.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_913.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1029.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1095.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1038.Linear",
- "__torch__.torch.nn.modules.container.___torch_mangle_1250.ModuleList",
- "__torch__.torch.nn.modules.linear.___torch_mangle_895.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1083.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_986.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_836.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_749.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1165.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1178.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_742.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_736.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_901.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_888.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1106.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1058.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_849.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1142.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_829.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_741.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1012.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1033.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_919.DecoderLayer",
- "__torch__.torch.nn.modules.sparse.___torch_mangle_723.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_776.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_964.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_943.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1245.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1249.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_858.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_759.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1053.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_866.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1164.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1234.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_815.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1153.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_936.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_957.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1031.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_950.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1081.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_795.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_912.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_930.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_994.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_794.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1088.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_868.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_841.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1162.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1168.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1074.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1223.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1146.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_857.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1240.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_755.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_842.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1183.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1128.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1061.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_757.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_732.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_890.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_886.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1112.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1203.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1210.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_876.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_865.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_965.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1135.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1233.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1221.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_922.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1231.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1184.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_779.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1035.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_955.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_929.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_792.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1216.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1045.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1230.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1152.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1197.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1060.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_743.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1124.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_982.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_789.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_766.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1024.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1102.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_823.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1055.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_768.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_961.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1198.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1235.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1003.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1047.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_975.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1092.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_956.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_783.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_775.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1042.DecoderCrossAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_804.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1169.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_879.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1238.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_853.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1013.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_770.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1116.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_931.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1131.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_744.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_946.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1225.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_897.DecoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1147.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_800.DecoderCrossAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_903.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1172.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1097.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1019.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_935.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1057.DecoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_855.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_973.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1192.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1004.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1141.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_980.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_999.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_944.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_992.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_850.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_996.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_978.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1237.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_990.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_924.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1063.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_771.DecoderSelfAttention",
- "__torch__.torch.nn.modules.activation.___torch_mangle_934.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_819.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1190.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1246.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_948.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1144.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_972.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_958.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_802.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_748.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_790.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_1050.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_726.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_803.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_908.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1115.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1185.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_997.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_937.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1193.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_860.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1205.DecoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_786.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_751.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_840.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_906.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1242.GELU",
- "collections.OrderedDict",
- "__torch__.torch.nn.modules.linear.___torch_mangle_834.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.DecoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_954.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_902.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_951.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1014.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1121.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1155.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_725.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1157.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1195.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_846.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_892.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1101.DecoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_914.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1117.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1224.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_762.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_883.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_788.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1208.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1086.DecoderCrossAttention",
- "__torch__.torch.nn.modules.activation.___torch_mangle_1132.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1180.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_988.Linear",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_932.DecoderCrossAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1071.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_734.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1078.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_1008.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_decoder.___torch_mangle_1051.DecoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_820.Linear"
How to fix it?
2.72 GB
commit
encoder.pt
Detected Pickle imports (373)
- "collections.OrderedDict",
- "torch.DoubleStorage",
- "torch.LongStorage",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.torch.nn.modules.linear.___torch_mangle_284.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_313.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_55.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_245.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_72.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_318.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_223.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_235.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_247.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_339.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_84.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_134.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_296.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_83.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_222.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_182.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_77.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_232.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_329.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_185.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_20.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_196.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_103.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_208.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_188.GLU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_62.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_13.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_45.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_199.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_128.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_90.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_298.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_147.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_295.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_65.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_119.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_299.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_176.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_321.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_309.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_125.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_261.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_190.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_122.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_281.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_327.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_267.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_117.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_343.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_76.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_219.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_262.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_97.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_289.LayerNorm",
- "__torch__.torch.nn.modules.linear.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_127.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_234.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_314.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_116.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_203.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_341.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_67.Linear",
- "__torch__.torch.nn.modules.activation.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_233.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_166.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_53.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_143.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_349.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_212.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_260.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_41.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_152.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_68.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_11.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_275.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_37.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_99.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_172.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_50.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_237.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_347.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_336.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_131.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_259.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_89.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_111.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_333.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_30.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_28.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_33.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_2.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_246.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_79.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_49.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_137.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_52.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_175.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_167.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_227.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_302.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_355.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_57.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_141.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_189.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_150.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_183.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_78.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_292.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_197.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_285.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_80.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_35.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_334.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_204.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_133.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_178.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_220.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_276.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_338.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_180.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_205.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_132.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_24.EncoderLayer",
- "torch.FloatStorage",
- "__torch__.torch.nn.modules.linear.___torch_mangle_27.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_93.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_326.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_5.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_323.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_217.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_301.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_311.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_86.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_8.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_170.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_192.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_215.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_310.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_26.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_257.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_96.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_258.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_230.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_213.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_201.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_335.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_312.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_348.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_211.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_154.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_238.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_101.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_270.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_9.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_202.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_138.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_291.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_66.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_82.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_159.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_136.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_324.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_42.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_174.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_305.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_332.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_187.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_15.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_322.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_229.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_47.GELU",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.torch.nn.modules.linear.___torch_mangle_179.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_115.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_7.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_209.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_320.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_315.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_225.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_113.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_19.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_88.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_337.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_356.LayerNorm",
- "__torch__.torch.nn.modules.sparse.___torch_mangle_0.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_200.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_195.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_158.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_63.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_268.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_46.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_54.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_94.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_118.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_193.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_110.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_173.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_352.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_130.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_344.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_71.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_171.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_22.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_87.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_279.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_250.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_346.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_48.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_186.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_153.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_144.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_6.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_241.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_177.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_104.Linear",
- "__torch__.torch.nn.modules.container.ModuleList",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_226.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_274.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_236.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_308.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_34.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_69.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_85.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_157.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_243.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_140.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_92.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_124.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_354.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_255.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_294.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_252.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_263.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_303.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_149.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.DalleBartEncoder",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_160.LayerNorm",
- "__torch__.torch.nn.modules.normalization.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_109.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_282.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_73.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_286.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_306.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_135.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_216.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_342.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_228.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_288.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_23.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_44.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_319.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_293.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_25.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_12.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_102.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_155.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_139.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_36.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_214.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_249.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_210.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_307.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_91.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_105.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_31.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_146.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_17.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_287.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_345.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_40.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_248.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_112.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_300.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_81.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_304.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_278.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_129.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_39.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_114.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_218.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_16.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_61.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_181.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_60.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_231.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_21.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_4.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_95.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_43.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_198.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_273.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_184.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_239.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_123.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_206.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_106.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_126.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_244.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_283.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_316.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_3.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_240.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_297.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_151.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_271.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_290.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_251.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_272.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_266.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_242.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_56.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_70.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_161.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_265.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_75.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_120.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_351.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_191.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_277.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_51.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_58.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_331.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_108.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_253.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_256.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_317.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_168.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_74.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_164.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_350.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_18.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_14.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_330.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_142.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_254.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_156.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_100.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_121.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_169.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_98.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_145.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_280.LayerNorm",
- "__torch__.torch.nn.modules.sparse.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_59.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_328.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_207.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_162.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_224.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_340.LayerNorm",
- "collections.OrderedDict",
- "__torch__.torch.nn.modules.linear.___torch_mangle_148.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_165.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_353.GLU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_107.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_32.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_264.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_64.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_269.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_325.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_221.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_29.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_194.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_10.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_38.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_163.Linear"
How to fix it?
4.12 GB
commit
encoder_fp16.pt
Detected Pickle imports (373)
- "collections.OrderedDict",
- "torch.DoubleStorage",
- "torch.LongStorage",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.torch.nn.modules.linear.___torch_mangle_284.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_313.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_55.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_245.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_72.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_318.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_223.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_235.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_247.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_339.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_84.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_134.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_296.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_83.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_222.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_182.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_77.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_232.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_329.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_185.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_20.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_196.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_103.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_208.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_188.GLU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_62.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_13.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_45.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_199.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_128.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_90.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_298.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_147.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_295.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_65.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_119.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_299.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_176.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_321.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_309.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_125.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_261.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_190.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_122.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_281.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_327.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_267.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_117.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_343.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_76.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_219.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_262.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_97.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_289.LayerNorm",
- "__torch__.torch.nn.modules.linear.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_127.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_234.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_314.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_116.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_203.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_341.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_67.Linear",
- "__torch__.torch.nn.modules.activation.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_233.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_166.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_53.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_143.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_349.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_212.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_260.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_41.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_152.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_68.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_11.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_275.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_37.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_99.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_172.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_50.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_237.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_347.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_336.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_131.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_259.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_89.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_111.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_333.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_30.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_28.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_33.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_2.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_246.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_79.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_49.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_137.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_52.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_175.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_167.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_227.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_302.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_355.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_57.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_141.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_189.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_150.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_183.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_78.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_292.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_197.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_285.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_80.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_35.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_334.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_204.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_133.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_178.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_220.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_276.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_338.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_180.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_205.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_132.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_24.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_27.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_93.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_326.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_5.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_323.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_217.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_301.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_311.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_86.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_8.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_170.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_192.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_215.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_310.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_26.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_257.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_96.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_258.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_230.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_213.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_201.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_335.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_312.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_348.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_211.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_154.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_238.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_101.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_270.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_9.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_202.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_138.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_291.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_66.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_82.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_159.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_136.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_324.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_42.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_174.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_305.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_332.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_187.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_15.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_322.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_229.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_47.GELU",
- "torch._utils._rebuild_tensor_v2",
- "__torch__.torch.nn.modules.linear.___torch_mangle_179.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_115.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_7.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_209.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_320.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_315.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_225.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_113.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_19.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_88.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_337.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_356.LayerNorm",
- "__torch__.torch.nn.modules.sparse.___torch_mangle_0.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_200.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_195.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_158.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_63.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_268.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_46.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_54.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_94.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_118.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_193.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_110.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_173.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_352.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_130.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_344.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_71.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_171.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_22.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_87.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_279.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_250.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_346.LayerNorm",
- "torch.HalfStorage",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_48.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_186.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_153.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_144.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_6.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_241.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_177.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_104.Linear",
- "__torch__.torch.nn.modules.container.ModuleList",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_226.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_274.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_236.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_308.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_34.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_69.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_85.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_157.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_243.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_140.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_92.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_124.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_354.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_255.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_294.EncoderLayer",
- "__torch__.torch.nn.modules.linear.___torch_mangle_252.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_263.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_303.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_149.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.DalleBartEncoder",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_160.LayerNorm",
- "__torch__.torch.nn.modules.normalization.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_109.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_282.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_73.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_286.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_306.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_135.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_216.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_342.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_228.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_288.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_23.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_44.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_319.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_293.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_25.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_12.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_102.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_155.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_139.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_36.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_214.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_249.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_210.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_307.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_91.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_105.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_31.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_146.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_17.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_287.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_345.EncoderSelfAttention",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_40.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_248.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_112.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_300.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_81.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_304.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_278.GLU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_129.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_39.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_114.EncoderLayer",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_218.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_16.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_61.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_181.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_1.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_60.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_231.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_21.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_4.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_95.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_43.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_198.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_273.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_184.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_239.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_123.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_206.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_106.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_126.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_244.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_283.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_316.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_3.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_240.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_297.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_151.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_271.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_290.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_251.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_272.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_266.Linear",
- "__torch__.torch.nn.modules.activation.___torch_mangle_242.GELU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_56.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_70.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_161.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_265.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_75.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_120.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_351.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_191.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_277.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_51.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_58.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_331.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_108.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_253.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_256.LayerNorm",
- "__torch__.torch.nn.modules.activation.___torch_mangle_317.GELU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_168.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_74.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_164.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_350.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_18.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_14.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_330.EncoderSelfAttention",
- "__torch__.torch.nn.modules.linear.___torch_mangle_142.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_254.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_156.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_100.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_121.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_169.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_98.GLU",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_145.LayerNorm",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_280.LayerNorm",
- "__torch__.torch.nn.modules.sparse.Embedding",
- "__torch__.torch.nn.modules.linear.___torch_mangle_59.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_328.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_207.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_162.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_224.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_340.LayerNorm",
- "collections.OrderedDict",
- "__torch__.torch.nn.modules.linear.___torch_mangle_148.Linear",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_165.EncoderSelfAttention",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_353.GLU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_107.GELU",
- "__torch__.torch.nn.modules.activation.___torch_mangle_32.GELU",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_264.EncoderLayer",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_64.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_269.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_325.LayerNorm",
- "__torch__.torch.nn.modules.linear.___torch_mangle_221.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_29.Linear",
- "__torch__.torch.nn.modules.linear.___torch_mangle_194.Linear",
- "__torch__.torch.nn.modules.normalization.___torch_mangle_10.LayerNorm",
- "__torch__.min_dalle.models.dalle_bart_encoder.___torch_mangle_38.GLU",
- "__torch__.torch.nn.modules.linear.___torch_mangle_163.Linear"
How to fix it?
2.05 GB
commit
-
461 kB
commit
-
802 kB
commit