diff --git a/.cache/empty.txt b/.cache/empty.txt deleted file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..0000000000000000000000000000000000000000 diff --git a/.gitattributes b/.gitattributes index 086eeef60fb35297da68b8c842db1e0e338fd577..9920734790f3df3740765754c92c61d3e9f742df 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,348 +33,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text -libs/fmt.dll filter=lfs diff=lfs merge=lfs -text -libs/onnx_custom_ops.dll filter=lfs diff=lfs merge=lfs -text -libs/ryzen_mm.dll filter=lfs diff=lfs merge=lfs -text -libs/spdlog.dll filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_10.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_100.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_101.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_102.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_103.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_104.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_105.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_106.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_107.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_108.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_109.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_11.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_110.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_111.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_112.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_113.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_115.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_118.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_119.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_12.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_120.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_121.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_124.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_127.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_13.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_130.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_131.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_132.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_133.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_135.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_137.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_139.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_14.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_142.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_143.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_144.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_145.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_148.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_15.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_151.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_154.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_155.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_156.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_157.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_158.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_16.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_160.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_162.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_163.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_165.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_168.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_169.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_17.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_170.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_171.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_174.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_177.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_180.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_181.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_182.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_183.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_185.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_187.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_189.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_19.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_192.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_193.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_194.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_195.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_198.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_201.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_204.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_205.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_206.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_207.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_208.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_21.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_210.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_212.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_214.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_216.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_218.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_22.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_220.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_222.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_225.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_226.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_227.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_232.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_235.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_238.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_24.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_241.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_242.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_243.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_244.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_246.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_248.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_250.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_252.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_253.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_255.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_257.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_258.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_26.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_260.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_262.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_263.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_265.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_267.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_269.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_270.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_272.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_275.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_276.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_277.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_278.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_281.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_284.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_287.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_288.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_289.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_29.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_290.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_292.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_294.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_295.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_297.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_3.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_30.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_300.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_301.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_302.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_303.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_306.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_309.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_31.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_312.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_313.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_314.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_315.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_317.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_319.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_32.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_320.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_322.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_325.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_326.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_327.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_328.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_331.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_334.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_337.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_338.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_339.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_340.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_342.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_344.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_346.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_347.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_349.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_35.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_352.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_353.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_354.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_355.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_358.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_361.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_364.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_365.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_366.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_367.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_369.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_371.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_372.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_374.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_377.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_378.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_379.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_38.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_380.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_383.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_386.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_389.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_390.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_391.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_392.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_394.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_396.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_397.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_399.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_4.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_402.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_403.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_404.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_405.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_408.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_41.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_411.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_414.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_415.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_416.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_417.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_419.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_42.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_421.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_423.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_424.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_426.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_429.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_43.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_430.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_431.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_432.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_435.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_438.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_44.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_441.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_442.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_443.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_444.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_446.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_448.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_449.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_451.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_454.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_455.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_456.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_457.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_46.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_460.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_463.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_466.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_467.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_468.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_469.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_47.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_471.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_473.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_474.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_476.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_479.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_480.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_481.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_482.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_485.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_488.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_49.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_491.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_492.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_493.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_494.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_5.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_51.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_54.const filter=lfs diff=lfs merge=lfs -text 
-unet/.cache/NhwcConv_0-conv_inConv_55.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_56.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_57.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_6.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_60.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_63.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_66.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_67.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_68.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_69.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_7.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_70.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_72.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_73.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_75.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_76.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_77.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_78.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_79.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_8.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_80.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_81.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_82.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_83.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_84.const filter=lfs 
diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_85.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_86.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_87.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_88.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_89.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_9.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_90.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_91.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_92.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_93.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_94.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_95.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_96.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_97.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_98.const filter=lfs diff=lfs merge=lfs -text -unet/.cache/NhwcConv_0-conv_inConv_99.const filter=lfs diff=lfs merge=lfs -text -unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt filter=lfs diff=lfs merge=lfs -text -unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst filter=lfs diff=lfs merge=lfs -text -unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state filter=lfs diff=lfs merge=lfs -text -unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_10.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_11.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_13.const filter=lfs diff=lfs merge=lfs -text 
-vae_decoder/.cache/NhwcConv_0-post_quant_convConv_16.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_19.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_22.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_25.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_28.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_31.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_34.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_37.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_39.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_4.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_42.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_45.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_48.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_51.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_54.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_57.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_59.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_61.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_63.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_66.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_69.const filter=lfs diff=lfs 
merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_7.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_72.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_75.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_78.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_80.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_84.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_87.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_9.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_90.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_93.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_96.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/.cache/NhwcConv_0-post_quant_convConv_99.const filter=lfs diff=lfs merge=lfs -text -vae_decoder/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.ctrlpkt filter=lfs diff=lfs merge=lfs -text -vae_decoder/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.fconst filter=lfs diff=lfs merge=lfs -text -vae_decoder/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.state filter=lfs diff=lfs merge=lfs -text -vae_decoder/dd_metastate_Sd15_Decoder_NhwcConv_0-post_quant_convConv.super filter=lfs diff=lfs merge=lfs -text -ryzen-ai-end-user-license-agreement-public.pdf filter=lfs diff=lfs merge=lfs -text +*.ctrlpkt filter=lfs diff=lfs merge=lfs -text +*.fconst filter=lfs diff=lfs merge=lfs -text +*.state filter=lfs diff=lfs merge=lfs -text +*.super filter=lfs diff=lfs merge=lfs -text diff --git a/LICENSE b/LICENSE new file mode 100644 index 
0000000000000000000000000000000000000000..928aa738f243e6df76ab3e91d4a2b81809da6d64 --- /dev/null +++ b/LICENSE @@ -0,0 +1,82 @@ +Copyright (c) 2022 Robin Rombach and Patrick Esser and contributors + +CreativeML Open RAIL-M +dated August 22, 2022 + +Section I: PREAMBLE + +Multimodal generative models are being widely adopted and used, and have the potential to transform the way artists, among other individuals, conceive and benefit from AI or ML technologies as a tool for content creation. + +Notwithstanding the current and potential benefits that these artifacts can bring to society at large, there are also concerns about potential misuses of them, either due to their technical limitations or ethical considerations. + +In short, this license strives for both the open and responsible downstream use of the accompanying model. When it comes to the open character, we took inspiration from open source permissive licenses regarding the grant of IP rights. Referring to the downstream responsible use, we added use-based restrictions not permitting the use of the Model in very specific scenarios, in order for the licensor to be able to enforce the license in case potential misuses of the Model may occur. At the same time, we strive to promote open and responsible research on generative models for art and content generation. + +Even though downstream derivative versions of the model could be released under different licensing terms, the latter will always have to include - at minimum - the same use-based restrictions as the ones in the original license (this license). We believe in the intersection between open and responsible AI development; thus, this License aims to strike a balance between both in order to enable responsible open-science in the field of AI. + +This License governs the use of the model (and its derivatives) and is informed by the model card associated with the model. + +NOW THEREFORE, You and Licensor agree as follows: + +1. 
Definitions + +- "License" means the terms and conditions for use, reproduction, and Distribution as defined in this document. +- "Data" means a collection of information and/or content extracted from the dataset used with the Model, including to train, pretrain, or otherwise evaluate the Model. The Data is not licensed under this License. +- "Output" means the results of operating a Model as embodied in informational content resulting therefrom. +- "Model" means any accompanying machine-learning based assemblies (including checkpoints), consisting of learnt weights, parameters (including optimizer states), corresponding to the model architecture as embodied in the Complementary Material, that have been trained or tuned, in whole or in part on the Data, using the Complementary Material. +- "Derivatives of the Model" means all modifications to the Model, works based on the Model, or any other model which is created or initialized by transfer of patterns of the weights, parameters, activations or output of the Model, to the other model, in order to cause the other model to perform similarly to the Model, including - but not limited to - distillation methods entailing the use of intermediate data representations or methods based on the generation of synthetic data by the Model for training the other model. +- "Complementary Material" means the accompanying source code and scripts used to define, run, load, benchmark or evaluate the Model, and used to prepare data for training or evaluation, if any. This includes any accompanying documentation, tutorials, examples, etc, if any. +- "Distribution" means any transmission, reproduction, publication or other sharing of the Model or Derivatives of the Model to a third party, including providing the Model as a hosted service made available by electronic or other remote means - e.g. API-based or web access. 
+- "Licensor" means the copyright owner or entity authorized by the copyright owner that is granting the License, including the persons or entities that may have rights in the Model and/or distributing the Model. +- "You" (or "Your") means an individual or Legal Entity exercising permissions granted by this License and/or making use of the Model for whichever purpose and in any field of use, including usage of the Model in an end-use application - e.g. chatbot, translator, image generator. +- "Third Parties" means individuals or legal entities that are not under common control with Licensor or You. +- "Contribution" means any work of authorship, including the original version of the Model and any modifications or additions to that Model or Derivatives of the Model thereof, that is intentionally submitted to Licensor for inclusion in the Model by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Model, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution." +- "Contributor" means Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Model. + +Section II: INTELLECTUAL PROPERTY RIGHTS + +Both copyright and patent grants apply to the Model, Derivatives of the Model and Complementary Material. The Model and Derivatives of the Model are subject to additional terms as described in Section III. + +2. Grant of Copyright License. 
Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare, publicly display, publicly perform, sublicense, and distribute the Complementary Material, the Model, and Derivatives of the Model. +3. Grant of Patent License. Subject to the terms and conditions of this License and where and as applicable, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this paragraph) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Model and the Complementary Material, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Model to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Model and/or Complementary Material or a Contribution incorporated within the Model and/or Complementary Material constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for the Model and/or Work shall terminate as of the date such litigation is asserted or filed. + +Section III: CONDITIONS OF USAGE, DISTRIBUTION AND REDISTRIBUTION + +4. Distribution and Redistribution. You may host for Third Party remote access purposes (e.g. software-as-a-service), reproduce and distribute copies of the Model or Derivatives of the Model thereof in any medium, with or without modifications, provided that You meet the following conditions: +Use-based restrictions as referenced in paragraph 5 MUST be included as an enforceable provision by You in any type of legal agreement (e.g. 
a license) governing the use and/or distribution of the Model or Derivatives of the Model, and You shall give notice to subsequent users You Distribute to, that the Model or Derivatives of the Model are subject to paragraph 5. This provision does not apply to the use of Complementary Material. +You must give any Third Party recipients of the Model or Derivatives of the Model a copy of this License; +You must cause any modified files to carry prominent notices stating that You changed the files; +You must retain all copyright, patent, trademark, and attribution notices excluding those notices that do not pertain to any part of the Model, Derivatives of the Model. +You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions - respecting paragraph 4.a. - for use, reproduction, or Distribution of Your modifications, or for any such Derivatives of the Model as a whole, provided Your use, reproduction, and Distribution of the Model otherwise complies with the conditions stated in this License. +5. Use-based restrictions. The restrictions set forth in Attachment A are considered Use-based restrictions. Therefore You cannot use the Model and the Derivatives of the Model for the specified restricted uses. You may use the Model subject to this License, including only for lawful purposes and in accordance with the License. Use may include creating any content with, finetuning, updating, running, training, evaluating and/or reparametrizing the Model. You shall require all of Your users who use the Model or a Derivative of the Model to comply with the terms of this paragraph (paragraph 5). +6. The Output You Generate. Except as set forth herein, Licensor claims no rights in the Output You generate using the Model. You are accountable for the Output you generate and its subsequent uses. No use of the output can contravene any provision as stated in the License. + +Section IV: OTHER PROVISIONS + +7. 
Updates and Runtime Restrictions. To the maximum extent permitted by law, Licensor reserves the right to restrict (remotely or otherwise) usage of the Model in violation of this License, update the Model through electronic means, or modify the Output of the Model based on updates. You shall undertake reasonable efforts to use the latest version of the Model. +8. Trademarks and related. Nothing in this License permits You to make use of Licensors’ trademarks, trade names, logos or to otherwise suggest endorsement or misrepresent the relationship between the parties; and any rights not expressly granted herein are reserved by the Licensors. +9. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Model and the Complementary Material (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Model, Derivatives of the Model, and the Complementary Material and assume any risks associated with Your exercise of permissions under this License. +10. Limitation of Liability. 
In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Model and the Complementary Material (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages. +11. Accepting Warranty or Additional Liability. While redistributing the Model, Derivatives of the Model and the Complementary Material thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability. +12. If any provision of this License is held to be invalid, illegal or unenforceable, the remaining provisions shall be unaffected thereby and remain valid as if such provision had not been set forth herein. 
+ +END OF TERMS AND CONDITIONS + + + + +Attachment A + +Use Restrictions + +You agree not to use the Model or Derivatives of the Model: +- In any way that violates any applicable national, federal, state, local or international law or regulation; +- For the purpose of exploiting, harming or attempting to exploit or harm minors in any way; +- To generate or disseminate verifiably false information and/or content with the purpose of harming others; +- To generate or disseminate personal identifiable information that can be used to harm an individual; +- To defame, disparage or otherwise harass others; +- For fully automated decision making that adversely impacts an individual’s legal rights or otherwise creates or modifies a binding, enforceable obligation; +- For any use intended to or which has the effect of discriminating against or harming individuals or groups based on online or offline social behavior or known or predicted personal or personality characteristics; +- To exploit any of the vulnerabilities of a specific group of persons based on their age, social, physical or mental characteristics, in order to materially distort the behavior of a person pertaining to that group in a manner that causes or is likely to cause that person or another person physical or psychological harm; +- For any use intended to or which has the effect of discriminating against individuals or groups based on legally protected characteristics or categories; +- To provide medical advice and medical results interpretation; +- To generate or disseminate information for the purpose to be used for administration of justice, law enforcement, immigration or asylum processes, such as predicting an individual will commit fraud/crime commitment (e.g. by text profiling, drawing causal relationships between assertions made in documents, indiscriminate and arbitrarily-targeted use). 
\ No newline at end of file diff --git a/README.md b/README.md index 57accbf0d892adbc9b51038e28458f0bcea36cce..a0d1650d791d416935033725cf8dab975bef3b7f 100644 --- a/README.md +++ b/README.md @@ -1,70 +1,80 @@ --- +language: en license: creativeml-openrail-m +tags: +- stable-diffusion +- stable-diffusion-diffusers +- text-to-image +- RyzenAI +- Quantization +- ONNX +- Computer Vision +inference: true --- -# Image Generation NPU Models – SD 1.5 +# 🚀 Stable Diffusion 1.5 on AMD AI PC NPU -This repository contains the ONNX models and runtime libraries required to run the image generation pipeline on AMD NPUs. +"Stable Diffusion is a latent text-to-image diffusion model capable of generating photo-realistic images given any text input. For more information about how Stable Diffusion functions, please have a look at [🤗's Stable Diffusion blog](https://huggingface.co/blog/stable_diffusion)". +More details about this model can be found on the original Hugging Face model card: [stable-diffusion-v1-5/stable-diffusion-v1-5](https://huggingface.co/stable-diffusion-v1-5/stable-diffusion-v1-5). -The folder structure is organized to mirror the main components of the diffusion pipeline (UNet, VAE decoder, text encoder, tokenizer and scheduler), plus the platform-specific runtime libraries. +This model repo contains the optimized ONNX models required to run the image generation pipeline for Stable Diffusion 1.5 on AMD NPUs. ---- +## Model Details -## Repository structure +The folder structure is organized to mirror the main components of the diffusion pipeline (scheduler, text encoder, tokenizer, UNet, and VAE decoder). -``` -. -├─ libs/ +```text ├─ scheduler/ ├─ text_encoder/ ├─ tokenizer/ ├─ unet/ └─ vae_decoder/ ``` +The [scheduler](scheduler) folder contains the scheduler configuration (timesteps, betas, alphas, etc.) used during the diffusion sampling process. -### `libs/` -This folder contains the dynamic libraries (`.dll`) required at runtime by the NPU backend. 
-They must be placed in a location where the application can load them (e.g., in the same folder as the executable or in the system `PATH`). +The [text_encoder](text_encoder) folder contains the text encoder model used to convert the input prompt into conditioning embeddings for the diffusion model. -### `unet/` -This folder contains the UNet model used in the diffusion process. -The UNet is exported and structured specifically to leverage the AMD NPU accelerator for the denoising steps. +The [tokenizer](tokenizer) folder contains the tokenizer configuration and vocabulary files required to preprocess the text prompt before it is fed to the text encoder. -### `vae_decoder/` -This folder contains the VAE decoder model used to map latent representations back to the image space. -The VAE decoder is also structured to make use of the NPU accelerator for efficient image reconstruction. +The [unet](unet) folder contains the UNet model used in the diffusion process. The UNet is exported and structured specifically to leverage the AMD NPU accelerator for the denoising steps. -### `text_encoder/` -This folder contains the text encoder model used to convert the input prompt into conditioning embeddings for the diffusion model. +The [vae_decoder](vae_decoder) folder contains the VAE decoder model used to map latent representations back to the image space. The VAE decoder is also structured to make use of the NPU accelerator for efficient image reconstruction. -### `tokenizer/` -This folder contains the tokenizer configuration and vocabulary files required to preprocess the text prompt before it is fed to the text encoder. +> Note: UNet and VAE decoder models are optimized and structured to run on AMD NPUs. The other components (text encoder, tokenizer and scheduler) are shared between GPU and NPU pipelines, but are provided here for completeness. -### `scheduler/` -This folder contains the scheduler configuration (timesteps, betas, alphas, etc.) 
used during the diffusion sampling process. +| Model Details | Description | +| ----------- | ----------- | +| Person or organization developing model | [Giovanni Guasti (AMD)](https://huggingface.co/gguasti), [Benjamin Consolvo (AMD)](https://huggingface.co/bconsolvo) | +| Original model authors | [Robin Rombach](https://huggingface.co/rromb), [Patrick Esser](https://huggingface.co/pesser) | +| Model date | January 2026 | +| Model version | 1.7.0 | +| Model type | Diffusion-based text-to-image generation model | +| Information about training algorithms, parameters, fairness constraints or other applied approaches, and features | This is a model that can be used to generate and modify images based on text prompts. It is a [Latent Diffusion Model](https://arxiv.org/abs/2112.10752) that uses a fixed, pretrained text encoder ([CLIP ViT-L/14](https://arxiv.org/abs/2103.00020)) as suggested in the [Imagen paper](https://arxiv.org/abs/2205.11487). | +| License | [CreativeML OpenRAIL-M](LICENSE) | +| Where to send questions or comments about the model | [Community Tab](https://hf.co/amd/stable-diffusion-1.5-amdnpu/discussions) and [AMD Developer Community Discord](https://discord.gg/amd-dev) | ---- +## ⚡ Intended Use -## Release 1113 +#### Getting Started -This release corresponds to the **1113 build**. +To get started with this model, visit [github.com/amd/sd-sandbox](https://github.com/amd/sd-sandbox). -**Included in this version:** -- Updated UNet and VAE Decoder models optimized for AMD NPU execution. -- Synchronized text encoder, tokenizer, and scheduler components aligned with the 1113 pipeline. -- Updated runtime DLLs in the `libs/` folder. -- Improved model folder structure for compatibility with Procyon and NPU execution environments. +## ⚓ Ethical Considerations -**Notes:** -- All ONNX models in this release are validated with the 1113 test package. -- Ensure that the DLLs from `libs/` are correctly placed in the application’s search path. 
-- This release is intended for NPU execution; GPU versions are hosted separately. +AMD is committed to conducting our business in a fair, ethical and honest manner and in compliance with all applicable laws, rules and regulations. You can find out more at the [AMD Ethics and Compliance](https://www.amd.com/en/corporate/corporate-responsibility/ethics-and-compliance.html) page. ---- +## ⚠️ Caveats and Recommendations -## Notes +Please visit the original model card for more details: [stable-diffusion-v1-5/stable-diffusion-v1-5](https://huggingface.co/stable-diffusion-v1-5/stable-diffusion-v1-5). -- UNet and VAE decoder models are optimized and structured to run on AMD NPUs. -- The other components (text encoder, tokenizer and scheduler) are shared between GPU and NPU pipelines, but are provided here for completeness. -- Please refer to the associated application or benchmark documentation for detailed integration and usage instructions (e.g., how to set model paths, environment variables and library search paths). 
+## 📌 Citation Details ---- +```bibtex + @InProceedings{Rombach_2022_CVPR, + author = {Rombach, Robin and Blattmann, Andreas and Lorenz, Dominik and Esser, Patrick and Ommer, Bj\"orn}, + title = {High-Resolution Image Synthesis With Latent Diffusion Models}, + booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)}, + month = {June}, + year = {2022}, + pages = {10684-10695} + } +``` \ No newline at end of file diff --git a/SD1.5 NPU Model support for UL Procyon SD1.5_third_party_notices.txt b/SD1.5 NPU Model support for UL Procyon SD1.5_third_party_notices.txt deleted file mode 100644 index 3847f0fe69eeec18d274cf1004b003316598fc14..0000000000000000000000000000000000000000 --- a/SD1.5 NPU Model support for UL Procyon SD1.5_third_party_notices.txt +++ /dev/null @@ -1,220 +0,0 @@ -Third-Party Notices Report for Inventory for SD1.5 NPU Model support for UL Procyon SD1.5 - - - - AMD copyrighted code (MIT) - - - Copyright Statements - - Copyright (C) 2018 - 2022 Xilinx, Inc. All rights reserved. -Copyright (C) 2022-2024, Advanced Micro Devices, Inc. All Rights Reserved. - - - License Text https://spdx.org/licenses/MIT.html - - - Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions: - -The above copyright notice and this permission notice (including the next paragraph) shall be included in all copies or substantial portions of the Software. - -THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. - - AMD copyrighted code (Apache-2.0) - - - Copyright Statements - - Copyright?? 2022-2024 Advanced Micro Devices, Inc. All rights reserved. -Copyright 2015-2022 Xilinx, Inc. All rights reserved - -Copyright (C) 2022 Xilinx, Inc - - License Text https://spdx.org/licenses/Apache-2.0.html - - - Apache License -Version 2.0, January 2004 -http://www.apache.org/licenses/ - -TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION - -1. Definitions. -"License" shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document. - -"Licensor" shall mean the copyright owner or entity authorized by the copyright owner that is granting the License. - -"Legal Entity" shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, "control" means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity. - -"You" (or "Your") shall mean an individual or Legal Entity exercising permissions granted by this License. - -"Source" form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files. - -"Object" form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types. 
- -"Work" shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below). - -"Derivative Works" shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof. - -"Contribution" shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution." - -"Contributor" shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work. - -2. Grant of Copyright License. 
Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form. -3. Grant of Patent License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed. -4. Redistribution. 
You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions: -(a) You must give any other recipients of the Work or Derivative Works a copy of this License; and -(b) You must cause any modified files to carry prominent notices stating that You changed the files; and -(c) You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and -(d) If the Work includes a "NOTICE" text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License. -You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License. - -5. 
Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions. -6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file. -7. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License. -8. Limitation of Liability. 
In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages. -9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability. -END OF TERMS AND CONDITIONS - -APPENDIX: How to apply the Apache License to your work. - -To apply the Apache License to your work, attach the following boilerplate notice, with the fields enclosed by brackets "[]" replaced with your own identifying information. (Don't include the brackets!) The text should be enclosed in the appropriate comment syntax for the file format. We also recommend that a file or class name and description of purpose be included on the same "printed page" as the copyright notice for easier identification within third-party archives. 
- -Copyright [yyyy] [name of copyright owner] - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - -http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. - -Standard License Header -Copyright [yyyy] [name of copyright owner] - -Licensed under the Apache License, Version 2.0 (the "License"); -you may not use this file except in compliance with the License. -You may obtain a copy of the License at - -http://www.apache.org/licenses/LICENSE-2.0 - -Unless required by applicable law or agreed to in writing, software -distributed under the License is distributed on an "AS IS" BASIS, -WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -See the License for the specific language governing permissions and -limitations under the License. - - stbrumme-hash-library v-u (Zlib) - - - Copyright Statements - - Copyright (c) 2014,2015 Stephan Brumme - - - License Text https://spdx.org/licenses/Zlib.html - - - This software is provided 'as-is', without any express or implied warranty. In no event will the authors be held liable for any damages arising from the use of this software. - -Permission is granted to anyone to use this software for any purpose, including commercial applications, and to alter it and redistribute it freely, subject to the following restrictions: - -1. The origin of this software must not be misrepresented; you must not claim that you wrote the original software. If you use this software in a product, an acknowledgment in the product documentation would be appreciated but is not required. -2. 
Altered source versions must be plainly marked as such, and must not be misrepresented as being the original software. -3. This notice may not be removed or altered from any source distribution. - - AMD copyrighted code (BSD-2-Clause) - - - Copyright Statements - - Copyright (C) 2022 Xilinx, Inc. All rights reserved. - * Copyright (C) 2023 ??? 2024 Advanced Micro Devices, Inc. All rights - * reserved - - License Text https://spdx.org/licenses/BSD-2-Clause.html - - - /* - * The Xilinx Vitis AI Vaip in this distribution are provided under the - * following free and permissive binary-only license, but are not provided in - * source code form. While the following free and permissive license is similar - * to the BSD open source license, it is NOT the BSD open source license nor - * other OSI-approved open source license. - * - * Copyright ?? 2020 Xilinx, Inc. - * - * Redistribution and use in binary form only, without modification, is - * permitted provided that the following conditions are met: - * - * 1. Redistributions must reproduce the above copyright notice, this list - * of conditions and the following disclaimer in the documentation and/or other - * materials provided with the distribution. - * - * 2. The name of Xilinx, Inc. may not be used to endorse or promote - * products redistributed with this software without specific prior written - * permission. - * - * THIS SOFTWARE IS PROVIDED BY XILINX, INC. "AS IS" AND ANY EXPRESS OR - * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF - * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO - * EVENT SHALL XILINX, INC. 
BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, - * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, - * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR - * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF - * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING - * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, - * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE - */ - - Zlib 1.3.1 (Zlib) - - - Copyright Statements - - Copyright (C) 2004, 2008, 2012 Mark Adler, all rights reserved - - License Text https://spdx.org/licenses/Zlib.html - - - This software is provided 'as-is', without any express or implied warranty. In no event will the authors be held liable for any damages arising from the use of this software. - -Permission is granted to anyone to use this software for any purpose, including commercial applications, and to alter it and redistribute it freely, subject to the following restrictions: - -1. The origin of this software must not be misrepresented; you must not claim that you wrote the original software. If you use this software in a product, an acknowledgment in the product documentation would be appreciated but is not required. -2. Altered source versions must be plainly marked as such, and must not be misrepresented as being the original software. -3. This notice may not be removed or altered from any source distribution. 
- - Zlib-Dotzlib v-u (BSL-1.0) - - - Copyright Statements - - Copyright Henrik Ravn 2004 - - License Text https://spdx.org/licenses/BSL-1.0.html - - - Permission is hereby granted, free of charge, to any person or organization obtaining a copy of the software and accompanying documentation covered by this license (the "Software") to use, reproduce, display, distribute, execute, and transmit the Software, and to prepare derivative works of the Software, and to permit third-parties to whom the Software is furnished to do so, all subject to the following: - -The copyright notices in the Software and this entire statement, including the above license grant, this restriction and the following disclaimer, must be included in all copies of the Software, in whole or in part, and all derivative works of the Software, unless such copies or derivative works are solely in the form of machine-executable object code generated by a source language processor. - -THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
- - Zlib v-u (Public Domain) - - - Copyright Statements - - NA - - License Text - - - Not copyrighted -- provided to the public domain - diff --git a/feature_extractor/preprocessor_config.json b/feature_extractor/preprocessor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..5294955ff7801083f720b34b55d0f1f51313c5c5 --- /dev/null +++ b/feature_extractor/preprocessor_config.json @@ -0,0 +1,20 @@ +{ + "crop_size": 224, + "do_center_crop": true, + "do_convert_rgb": true, + "do_normalize": true, + "do_resize": true, + "feature_extractor_type": "CLIPFeatureExtractor", + "image_mean": [ + 0.48145466, + 0.4578275, + 0.40821073 + ], + "image_std": [ + 0.26862954, + 0.26130258, + 0.27577711 + ], + "resample": 3, + "size": 224 +} diff --git a/libs/fmt.dll b/libs/fmt.dll deleted file mode 100644 index f1f77002adea185d8fd407693af6ee68cc546f14..0000000000000000000000000000000000000000 --- a/libs/fmt.dll +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5794983ed39f2c5da93f9ca1eb4edaf19f5b294b2f602758dabedb637bb32660 -size 132096 diff --git a/libs/onnx_custom_ops.dll b/libs/onnx_custom_ops.dll deleted file mode 100644 index 82474cb62c715f4efff3b86ef779e0a33e420c9a..0000000000000000000000000000000000000000 --- a/libs/onnx_custom_ops.dll +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4a4c644dd19883a39f07529a8f08f10dd5ed0eb1025fc2a288ffe3317bc4a494 -size 305880576 diff --git a/libs/ryzen_mm.dll b/libs/ryzen_mm.dll deleted file mode 100644 index a9db14987cdad1948a213463f3e77f3647163acc..0000000000000000000000000000000000000000 --- a/libs/ryzen_mm.dll +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:be362e0365a3fa7e3536fc32b0ba8c5e0ced5f1d69851426ec9588a13a2ec552 -size 277504 diff --git a/libs/ryzenai_onnx_utils.dll b/libs/ryzenai_onnx_utils.dll deleted file mode 100644 index 
b424fcf7e0abfd07578e91e007a27a74a24d7726..0000000000000000000000000000000000000000 Binary files a/libs/ryzenai_onnx_utils.dll and /dev/null differ diff --git a/libs/spdlog.dll b/libs/spdlog.dll deleted file mode 100644 index 069468934c8a09b44ca708a91a0e6ff235729f53..0000000000000000000000000000000000000000 --- a/libs/spdlog.dll +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bda960958e994d3f2b5004501a30bfc3e6a1bcbb152613e581ee5282273e8122 -size 264704 diff --git a/ryzen-ai-end-user-license-agreement-public.pdf b/ryzen-ai-end-user-license-agreement-public.pdf deleted file mode 100644 index 396833d17be25892ceb2e96b985e9e458d98337c..0000000000000000000000000000000000000000 --- a/ryzen-ai-end-user-license-agreement-public.pdf +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:587c5b4916ae6053f4a2fbc0a063532bd4ff9e50080491e75cb349c84f2b97a7 -size 168872 diff --git a/safety_checker/config.json b/safety_checker/config.json new file mode 100644 index 0000000000000000000000000000000000000000..5dbd88952e7e521aa665e5052e6db7def3641d03 --- /dev/null +++ b/safety_checker/config.json @@ -0,0 +1,175 @@ +{ + "_commit_hash": "4bb648a606ef040e7685bde262611766a5fdd67b", + "_name_or_path": "CompVis/stable-diffusion-safety-checker", + "architectures": [ + "StableDiffusionSafetyChecker" + ], + "initializer_factor": 1.0, + "logit_scale_init_value": 2.6592, + "model_type": "clip", + "projection_dim": 768, + "text_config": { + "_name_or_path": "", + "add_cross_attention": false, + "architectures": null, + "attention_dropout": 0.0, + "bad_words_ids": null, + "bos_token_id": 0, + "chunk_size_feed_forward": 0, + "cross_attention_hidden_size": null, + "decoder_start_token_id": null, + "diversity_penalty": 0.0, + "do_sample": false, + "dropout": 0.0, + "early_stopping": false, + "encoder_no_repeat_ngram_size": 0, + "eos_token_id": 2, + "exponential_decay_length_penalty": null, + "finetuning_task": null, + 
"forced_bos_token_id": null, + "forced_eos_token_id": null, + "hidden_act": "quick_gelu", + "hidden_size": 768, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1" + }, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 3072, + "is_decoder": false, + "is_encoder_decoder": false, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1 + }, + "layer_norm_eps": 1e-05, + "length_penalty": 1.0, + "max_length": 20, + "max_position_embeddings": 77, + "min_length": 0, + "model_type": "clip_text_model", + "no_repeat_ngram_size": 0, + "num_attention_heads": 12, + "num_beam_groups": 1, + "num_beams": 1, + "num_hidden_layers": 12, + "num_return_sequences": 1, + "output_attentions": false, + "output_hidden_states": false, + "output_scores": false, + "pad_token_id": 1, + "prefix": null, + "problem_type": null, + "pruned_heads": {}, + "remove_invalid_values": false, + "repetition_penalty": 1.0, + "return_dict": true, + "return_dict_in_generate": false, + "sep_token_id": null, + "task_specific_params": null, + "temperature": 1.0, + "tf_legacy_loss": false, + "tie_encoder_decoder": false, + "tie_word_embeddings": true, + "tokenizer_class": null, + "top_k": 50, + "top_p": 1.0, + "torch_dtype": null, + "torchscript": false, + "transformers_version": "4.22.0.dev0", + "typical_p": 1.0, + "use_bfloat16": false, + "vocab_size": 49408 + }, + "text_config_dict": { + "hidden_size": 768, + "intermediate_size": 3072, + "num_attention_heads": 12, + "num_hidden_layers": 12 + }, + "torch_dtype": "float32", + "transformers_version": null, + "vision_config": { + "_name_or_path": "", + "add_cross_attention": false, + "architectures": null, + "attention_dropout": 0.0, + "bad_words_ids": null, + "bos_token_id": null, + "chunk_size_feed_forward": 0, + "cross_attention_hidden_size": null, + "decoder_start_token_id": null, + "diversity_penalty": 0.0, + "do_sample": false, + "dropout": 0.0, + "early_stopping": false, + "encoder_no_repeat_ngram_size": 0, + "eos_token_id": null, + 
"exponential_decay_length_penalty": null, + "finetuning_task": null, + "forced_bos_token_id": null, + "forced_eos_token_id": null, + "hidden_act": "quick_gelu", + "hidden_size": 1024, + "id2label": { + "0": "LABEL_0", + "1": "LABEL_1" + }, + "image_size": 224, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 4096, + "is_decoder": false, + "is_encoder_decoder": false, + "label2id": { + "LABEL_0": 0, + "LABEL_1": 1 + }, + "layer_norm_eps": 1e-05, + "length_penalty": 1.0, + "max_length": 20, + "min_length": 0, + "model_type": "clip_vision_model", + "no_repeat_ngram_size": 0, + "num_attention_heads": 16, + "num_beam_groups": 1, + "num_beams": 1, + "num_channels": 3, + "num_hidden_layers": 24, + "num_return_sequences": 1, + "output_attentions": false, + "output_hidden_states": false, + "output_scores": false, + "pad_token_id": null, + "patch_size": 14, + "prefix": null, + "problem_type": null, + "pruned_heads": {}, + "remove_invalid_values": false, + "repetition_penalty": 1.0, + "return_dict": true, + "return_dict_in_generate": false, + "sep_token_id": null, + "task_specific_params": null, + "temperature": 1.0, + "tf_legacy_loss": false, + "tie_encoder_decoder": false, + "tie_word_embeddings": true, + "tokenizer_class": null, + "top_k": 50, + "top_p": 1.0, + "torch_dtype": null, + "torchscript": false, + "transformers_version": "4.22.0.dev0", + "typical_p": 1.0, + "use_bfloat16": false + }, + "vision_config_dict": { + "hidden_size": 1024, + "intermediate_size": 4096, + "num_attention_heads": 16, + "num_hidden_layers": 24, + "patch_size": 14 + } +} diff --git a/scheduler/scheduler_config.json b/scheduler/scheduler_config.json index 05ea38b0bf1f05eab83238c95aa943d28d9feec2..5c92390913b1a3948d08295f2e1dc150b1f1f79c 100644 --- a/scheduler/scheduler_config.json +++ b/scheduler/scheduler_config.json @@ -1,19 +1,13 @@ { "_class_name": "PNDMScheduler", - "_diffusers_version": "0.31.0", + "_diffusers_version": "0.6.0", "beta_end": 0.012, 
"beta_schedule": "scaled_linear", "beta_start": 0.00085, - "clip_sample": false, - "clip_sample_range": 1.0, - "dynamic_thresholding_ratio": 0.995, "num_train_timesteps": 1000, - "prediction_type": "epsilon", - "sample_max_value": 1.0, "set_alpha_to_one": false, "skip_prk_steps": true, "steps_offset": 1, - "thresholding": false, - "timestep_spacing": "leading", - "trained_betas": null + "trained_betas": null, + "clip_sample": false } diff --git a/text_encoder/config.json b/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..4d3e873ab5086ad989f407abd50fdce66db8d657 --- /dev/null +++ b/text_encoder/config.json @@ -0,0 +1,25 @@ +{ + "_name_or_path": "openai/clip-vit-large-patch14", + "architectures": [ + "CLIPTextModel" + ], + "attention_dropout": 0.0, + "bos_token_id": 0, + "dropout": 0.0, + "eos_token_id": 2, + "hidden_act": "quick_gelu", + "hidden_size": 768, + "initializer_factor": 1.0, + "initializer_range": 0.02, + "intermediate_size": 3072, + "layer_norm_eps": 1e-05, + "max_position_embeddings": 77, + "model_type": "clip_text_model", + "num_attention_heads": 12, + "num_hidden_layers": 12, + "pad_token_id": 1, + "projection_dim": 768, + "torch_dtype": "float32", + "transformers_version": "4.22.0.dev0", + "vocab_size": 49408 +} diff --git a/text_encoder/model.onnx b/text_encoder/model.onnx deleted file mode 100644 index fc4493364612545c5035a9ed528963175134b11a..0000000000000000000000000000000000000000 --- a/text_encoder/model.onnx +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:225c1b4a1421e615946d416934e86a2445693e560d550405ef0dcb7218294d54 -size 246473790 diff --git a/text_encoder/model.safetensors b/text_encoder/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..681382f735a1ae457c891ac30bd9e611b7b10091 --- /dev/null +++ b/text_encoder/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:d008943c017f0092921106440254dbbe00b6a285f7883ec8ba160c3faad88334 +size 492265874 diff --git a/tokenizer/special_tokens_map.json b/tokenizer/special_tokens_map.json index fc4052df9224ad33df97634e865128642aa12128..ad919e089d4d032a933a2a9087de2857d55af3bc 100644 --- a/tokenizer/special_tokens_map.json +++ b/tokenizer/special_tokens_map.json @@ -13,13 +13,7 @@ "rstrip": false, "single_word": false }, - "pad_token": { - "content": "<|endoftext|>", - "lstrip": false, - "normalized": true, - "rstrip": false, - "single_word": false - }, + "pad_token": "<|endoftext|>", "unk_token": { "content": "<|endoftext|>", "lstrip": false, diff --git a/tokenizer/tokenizer_config.json b/tokenizer/tokenizer_config.json index d3269e79768869e2475079df12936e4f5a5f00e2..ecce7b0cfe89c534c5d54b50aeec0a8b277d9fc9 100644 --- a/tokenizer/tokenizer_config.json +++ b/tokenizer/tokenizer_config.json @@ -1,30 +1,34 @@ { "add_prefix_space": false, - "added_tokens_decoder": { - "49406": { - "content": "<|startoftext|>", - "lstrip": false, - "normalized": true, - "rstrip": false, - "single_word": false, - "special": true - }, - "49407": { - "content": "<|endoftext|>", - "lstrip": false, - "normalized": true, - "rstrip": false, - "single_word": false, - "special": true - } + "bos_token": { + "__type": "AddedToken", + "content": "<|startoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false }, - "bos_token": "<|startoftext|>", - "clean_up_tokenization_spaces": true, "do_lower_case": true, - "eos_token": "<|endoftext|>", + "eos_token": { + "__type": "AddedToken", + "content": "<|endoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + }, "errors": "replace", "model_max_length": 77, + "name_or_path": "openai/clip-vit-large-patch14", "pad_token": "<|endoftext|>", + "special_tokens_map_file": "./special_tokens_map.json", "tokenizer_class": "CLIPTokenizer", - "unk_token": "<|endoftext|>" + "unk_token": { + "__type": 
"AddedToken", + "content": "<|endoftext|>", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false + } } diff --git a/unet/.cache/NhwcConv_0-conv_inConv_0.const b/unet/.cache/NhwcConv_0-conv_inConv_0.const deleted file mode 100644 index 445dfd25917ed0ab833b29a54864a66547cae708..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_0.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_1.const b/unet/.cache/NhwcConv_0-conv_inConv_1.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_1.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_10.const b/unet/.cache/NhwcConv_0-conv_inConv_10.const deleted file mode 100644 index 3c7fc6eb6957f70044f3915160de63164042f882..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_10.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f9287037a4ff616e8340c495ba5aed425a01c49ebead342c2734895c3944c976 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_100.const b/unet/.cache/NhwcConv_0-conv_inConv_100.const deleted file mode 100644 index d2cb3fae8bcecf5589709de33f5116403e4fab3a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_100.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7f363eda1b86f2510b5c4bbfa8e4304a4eba32883eabb34b49dfff96daf01f05 -size 934400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_101.const b/unet/.cache/NhwcConv_0-conv_inConv_101.const deleted file mode 100644 index 7abf61923797e41f775c00c53ff718b078d79581..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_101.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:3fda54a817686d9eaa2057ce4ac843ce21c4cd2abab55f33692c9939d4f74c6b -size 934400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_102.const b/unet/.cache/NhwcConv_0-conv_inConv_102.const deleted file mode 100644 index 23d8b7ee99b59d6eeec93996626b61290e6a29e8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_102.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:eabd19f63008feea9cbfc76a985a5bb20c17d5157e86563375cabf3f2e6c62f3 -size 934400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_103.const b/unet/.cache/NhwcConv_0-conv_inConv_103.const deleted file mode 100644 index 529b3b298b1636800b90cab23de990d52c1c68d9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_103.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:dd6e802361a2f3515cd1667d6cdf4370642dbd15f90b3c2d4d9bc0810b3c0c28 -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_104.const b/unet/.cache/NhwcConv_0-conv_inConv_104.const deleted file mode 100644 index ebe3433eb64741bf56e25afca03c96e51fe14f94..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_104.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f6b2a6024142d0c528445fbea7deb5c608bc01726272fe7bbef4a0b7a83ead0a -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_105.const b/unet/.cache/NhwcConv_0-conv_inConv_105.const deleted file mode 100644 index 0a737b2e42b4915ef34073ac703ec19f71673302..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_105.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d5f0384740d1ab366abc59c6135a0d06cea3b6b0bec92341441258fe7668a98d -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_106.const b/unet/.cache/NhwcConv_0-conv_inConv_106.const deleted file mode 100644 index 
769d0c646537b841ba432f1c2a948e1ee70ee6d8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_106.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e8a66a51189e8bd5e8bf40d945cd70bafeada5d17bc8feb4b0c0180f95427fa6 -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_107.const b/unet/.cache/NhwcConv_0-conv_inConv_107.const deleted file mode 100644 index c523de3931c2dc8a0be155386bc63c43c3ffaaa9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_107.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:98f64dce1ec91a0c3361deb40b171cb6394fb7e1ff035260ccafbb2982d899a0 -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_108.const b/unet/.cache/NhwcConv_0-conv_inConv_108.const deleted file mode 100644 index 9c3184f7efde52a131c814d58d044dbe66daca74..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_108.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c4548f8a18eef990420f7fae92e90d527d2770fd622b04f19ccfd8cc1ed5fa4f -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_109.const b/unet/.cache/NhwcConv_0-conv_inConv_109.const deleted file mode 100644 index 593b2df0afd5f63c5e169645dfb5ee1c4967d38d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_109.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2862931e79a38b0c4544e2e6bc1748b5599ca5802eae8969fe6d246811f44f00 -size 467200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_11.const b/unet/.cache/NhwcConv_0-conv_inConv_11.const deleted file mode 100644 index 1cdd29baeaddb664f83982b29c4a08eef1fb8d1e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_11.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:3d8a4370ae222b6b427a38c106a2b4e851e61c8c2d2258c9408a7ccf0e9a2ef5 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_110.const b/unet/.cache/NhwcConv_0-conv_inConv_110.const deleted file mode 100644 index 451a7f1dad0598e2a2a77cd45820037c412adfd9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_110.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:33d791c02c790bb84b0459276c9760feded2a21eb5050ec4da6658c0ae87d505 -size 467200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_111.const b/unet/.cache/NhwcConv_0-conv_inConv_111.const deleted file mode 100644 index 313f7626b6b5b8eee107b80e2cb83634827403e5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_111.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:96da6df55780f55bd4317d4cd17fb93633f153363df6bd2bb906a4e8774e6d69 -size 467200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_112.const b/unet/.cache/NhwcConv_0-conv_inConv_112.const deleted file mode 100644 index f5ad0ebffe15ce274148003c2d09f58d31321bf9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_112.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a20154997a7e6c16103c8d13122d9b59c70428acee57c0fe1dfd15619c904739 -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_113.const b/unet/.cache/NhwcConv_0-conv_inConv_113.const deleted file mode 100644 index 41cb3dff1babb9f031336f6a6086a10cb057b8a9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_113.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7eba2d5e4be63117ec4f8fbd51f959a50ac5a0c30a55d2c5aab62a1d121d57d0 -size 250880 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_114.const b/unet/.cache/NhwcConv_0-conv_inConv_114.const deleted file mode 100644 index 
03f8595e4b04fa9f640a7826fa70d2f250a78c39..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_114.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_115.const b/unet/.cache/NhwcConv_0-conv_inConv_115.const deleted file mode 100644 index 4f2248e72ff765fe68a28e6dd820b7ed09276fca..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_115.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:18a7bb0c7495c962f7436fe4c252ec6aea0f0c01416098112bd42c559e8d4a9f -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_116.const b/unet/.cache/NhwcConv_0-conv_inConv_116.const deleted file mode 100644 index ded50b479454acd523624899b4e77bd63c2863a0..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_116.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_117.const b/unet/.cache/NhwcConv_0-conv_inConv_117.const deleted file mode 100644 index a2f61f0e1f026697fadca845633629c0770c11db..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_117.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_118.const b/unet/.cache/NhwcConv_0-conv_inConv_118.const deleted file mode 100644 index 7eb5e3e922a64f0972ff39cc929717d1e2037d56..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_118.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:422ba5540a498cef728922c329ad5389e46a287e18c45eff619b77fbb23ae657 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_119.const b/unet/.cache/NhwcConv_0-conv_inConv_119.const deleted file mode 100644 index e09204f123cf45a4346e571305d9cbb4f42210ea..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_119.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:17bdf2ffecaebea1e3c02a64039eae8707e277452aedf0ad7e5da887d1afa084 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_12.const b/unet/.cache/NhwcConv_0-conv_inConv_12.const deleted file mode 100644 index 24a4c90677931fc9a478232e2cd04b97b1d41b56..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_12.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9bda1fac569a7d1e5e4761882f3f54ef2b1115b2ce0348414bbbb809a1ff8f37 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_120.const b/unet/.cache/NhwcConv_0-conv_inConv_120.const deleted file mode 100644 index 44d4299da5800c9595f378503a5af8f8c09864ee..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_120.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fb6d65075a39b439764372629d89edb3ebf47c1e63a83998ccdf2f6aa0455ad3 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_121.const b/unet/.cache/NhwcConv_0-conv_inConv_121.const deleted file mode 100644 index 5441908d29d1b36e2812133d06a10bc56eee7b60..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_121.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:880bcf7442c67df41afa34d7cad96a186f7ec5cdbee840a59d354cbf11945297 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_122.const b/unet/.cache/NhwcConv_0-conv_inConv_122.const deleted file mode 100644 index ba3ee889dc2714b6e67c7b390566e5d4be06a9bf..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_122.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_123.const b/unet/.cache/NhwcConv_0-conv_inConv_123.const deleted file mode 100644 index d29b678bbcccb34eed6b086aeda4784891cff154..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_123.const and /dev/null differ diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_124.const b/unet/.cache/NhwcConv_0-conv_inConv_124.const deleted file mode 100644 index 093c8dc750606fb2038825d1f515f5ad9b5939f0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_124.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2b2e1bbb8158545a312c336d2786df561672800d201f189785c7fdb87caa2b41 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_125.const b/unet/.cache/NhwcConv_0-conv_inConv_125.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_125.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_126.const b/unet/.cache/NhwcConv_0-conv_inConv_126.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_126.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_127.const b/unet/.cache/NhwcConv_0-conv_inConv_127.const deleted file mode 100644 index e6bda382e24d905b62ab88896d0a3e34f50b10f5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_127.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:815b40ccad7d537efc35775abb325a102b91c18300e93692bfc0bb8dbccd605f -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_128.const b/unet/.cache/NhwcConv_0-conv_inConv_128.const deleted file mode 100644 index e2247b7c890176d64cf6acd7c34229498b08f782..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_128.const +++ /dev/null @@ -1 +0,0 @@ 
->>>>>>>>>>>>>>>>>r>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>|>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>|>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>{>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>~>>u>>>>>>>>>>>>>>>>>>>>>>p>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>S>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_129.const b/unet/.cache/NhwcConv_0-conv_inConv_129.const deleted file mode 100644 index 6cd20333675af57468da16c4c26618e56aaef6b1..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_129.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_13.const b/unet/.cache/NhwcConv_0-conv_inConv_13.const deleted file mode 100644 index 200c9185ecbd085e53dc2318af4f98f8f9af491d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_13.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1962323973f3ec810487b147b1a4e115c66113147b577a0a9d3b937d56710f7d -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_130.const b/unet/.cache/NhwcConv_0-conv_inConv_130.const deleted file mode 100644 index 946a62cb94077c14d0512c9116ca205a344e1a70..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_130.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c55b8c2cb730229bdcc8b1c45255eb3cece8927e2ab8b9afe26070f39825d0da -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_131.const b/unet/.cache/NhwcConv_0-conv_inConv_131.const deleted file mode 100644 index 
3762ae803b2c32e2905f3acf32d646f74e4a14e8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_131.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7b5f8e5e0b60c9faa35079eec6744cec80b1c3e93b7a55833ef1d7ef90b47fa2 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_132.const b/unet/.cache/NhwcConv_0-conv_inConv_132.const deleted file mode 100644 index 4b5476a9c30add020d85e7b90297d83ae969c190..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_132.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:999a99b5843f8c57bc2ac271dc1ca26bf24b0d38faff32cc8d317ada954ef7f1 -size 1884160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_133.const b/unet/.cache/NhwcConv_0-conv_inConv_133.const deleted file mode 100644 index 23e7368fb8231e9411b9d887824a4d21f2ed8d8d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_133.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:19b3940282e1345d25bfa370bd50e57c0ef468e40485a624ab921f03a5c33b6d -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_134.const b/unet/.cache/NhwcConv_0-conv_inConv_134.const deleted file mode 100644 index bc71835776d7621300d42ec99aaf666c471a203d..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_134.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_135.const b/unet/.cache/NhwcConv_0-conv_inConv_135.const deleted file mode 100644 index 04a40bcf47d219cfe734f7e964fb8d46c002517e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_135.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c16d98979978f325a09a690121149e968e98e477943b5ca76d8e50cbb91fd0d1 -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_136.const 
b/unet/.cache/NhwcConv_0-conv_inConv_136.const deleted file mode 100644 index dbf92fb919a9ffe394f79e40829e2ec9ae76ed66..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_136.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_137.const b/unet/.cache/NhwcConv_0-conv_inConv_137.const deleted file mode 100644 index 6be1f0846c44bac1313ad249c9ea71431a64c80e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_137.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd09543d7284a4e6740f0455d3933da6d1a6bbfa3fc286fdba78e0ff0b2bad5e -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_138.const b/unet/.cache/NhwcConv_0-conv_inConv_138.const deleted file mode 100644 index 6bad565c3f9bba8d742ce3bb0a3d47dd0862dfe6..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_138.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_139.const b/unet/.cache/NhwcConv_0-conv_inConv_139.const deleted file mode 100644 index 706f3f9bbcbe82ece4fd770d1f32ea10d450f3e2..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_139.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c9f0b5b7b1c361f1923e693dae069389316cf9a9a90a56f9595132c816cefe9b -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_14.const b/unet/.cache/NhwcConv_0-conv_inConv_14.const deleted file mode 100644 index 319d723e31c3d71100de515100e0d628f9711aa3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_14.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:545263bd1d585f332350a001602642d86c7f23ad0bd9d17b7bde152543780a31 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_140.const b/unet/.cache/NhwcConv_0-conv_inConv_140.const deleted file mode 100644 index 
dd09d20b38186bc1b5f23d89fb00c2244b3fe7dd..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_140.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_141.const b/unet/.cache/NhwcConv_0-conv_inConv_141.const deleted file mode 100644 index 8eb2b6765c5d661fc94bd6430dd18d2d78230d72..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_141.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_142.const b/unet/.cache/NhwcConv_0-conv_inConv_142.const deleted file mode 100644 index 6f1e930f59bd6345f48a042d2f70a49f87892014..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_142.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:977213a7d13efba49c5630092e3993f5b5a1fd09dd9ee0013bcc7724aa2fb171 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_143.const b/unet/.cache/NhwcConv_0-conv_inConv_143.const deleted file mode 100644 index f49e966c083a9ad96cd18d901c217dcdad38873c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_143.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9109cd3dd0e72761a665f8353b3a9ac533a3e112247ef1e08bf5e74410f5712d -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_144.const b/unet/.cache/NhwcConv_0-conv_inConv_144.const deleted file mode 100644 index 7671bef3e6c32ab0d6ca6a496aa3705d632bb006..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_144.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:74b8a10eaa5a8b3d4ccbff42c4fd9c178665e33f5821345f072d142a882cf585 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_145.const b/unet/.cache/NhwcConv_0-conv_inConv_145.const deleted file mode 100644 index 65e88369f87994d11e701eae342d77ec3393a611..0000000000000000000000000000000000000000 --- 
a/unet/.cache/NhwcConv_0-conv_inConv_145.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:02b18971a662c7cb30ed5bbe2a562b2810aaba4e329e4569a7971fbfb64dda23 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_146.const b/unet/.cache/NhwcConv_0-conv_inConv_146.const deleted file mode 100644 index 5e86e7a42be74974b65ee303da63fa1c15452e43..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_146.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>T>>>>>>>>>>>>>>>>>>>>>>>>>>>>>t>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>v>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_147.const b/unet/.cache/NhwcConv_0-conv_inConv_147.const deleted file mode 100644 index b901ec7cd73996688ee97314f4c1870d43033025..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_147.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_148.const b/unet/.cache/NhwcConv_0-conv_inConv_148.const deleted file mode 100644 index 1d91467c0269bd3afdf260107da19f99a401b74c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_148.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b0e1e77204c552fa2998f5fdcaad508f255eceea893ac749896ada7a036693d4 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_149.const 
b/unet/.cache/NhwcConv_0-conv_inConv_149.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_149.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_15.const b/unet/.cache/NhwcConv_0-conv_inConv_15.const deleted file mode 100644 index 1b856aaab00bdd4e0f79c13e374181ff822ce786..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_15.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6d9d8875ddb8bea1e721ccd1db33380a2328c2a62cb16c8dc7deaca79817b6c5 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_150.const b/unet/.cache/NhwcConv_0-conv_inConv_150.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_150.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_151.const b/unet/.cache/NhwcConv_0-conv_inConv_151.const deleted file mode 100644 index 462e89d49d1070d58875109c2ffb69feb88cd70d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_151.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:04299c265d39a8de98e2178da251b49dc76c375b1f220eb296b512e597549218 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_152.const b/unet/.cache/NhwcConv_0-conv_inConv_152.const deleted file mode 100644 index ca413ddd873ccdd42870f252b4008ec97696e472..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_152.const +++ /dev/null @@ -1 +0,0 @@ 
->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>f>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>V>>>>>>>>>>>>>>>>>>>>>>>>>>>>> >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>M>>>>>>>>>>>>>>>>>>>>>>>>>>b>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>q>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>J>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_153.const b/unet/.cache/NhwcConv_0-conv_inConv_153.const deleted file mode 100644 index 2a9d25c7c560deec1473c7c21bfe85c1bed1bd0a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_153.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_154.const b/unet/.cache/NhwcConv_0-conv_inConv_154.const deleted file mode 100644 index 2518a97b2d56329ff87c798481d31f5dfa703bf4..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_154.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c5935f63383ae4cbcb5b05f12a9882e1050744046a1ab92b44b49eb805272081 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_155.const b/unet/.cache/NhwcConv_0-conv_inConv_155.const deleted file mode 100644 index bcbb0ac8193c9bf4f51091026787ce2fdb919af9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_155.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:05cde10ae7402a5c5435bb116ae48560bcf419cd24be6ed8d5baa5e280f69fb2 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_156.const b/unet/.cache/NhwcConv_0-conv_inConv_156.const deleted file mode 100644 index 
661b758f169a1fcb6a941523f2872f45b10d76f3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_156.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5deee15cfda59a34ee0630f9bc043a2c20d384207245a9c90391419b55674081 -size 1884160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_157.const b/unet/.cache/NhwcConv_0-conv_inConv_157.const deleted file mode 100644 index 97ef6266984ed2b45a8b22c02095abe3df149e33..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_157.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bd5a5403d1ed71647444ba4c6b116bc1ab830c6da3692691c3c63b516174c8fa -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_158.const b/unet/.cache/NhwcConv_0-conv_inConv_158.const deleted file mode 100644 index 357ad6c978687312cd7c781e5e3ef3b233a75022..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_158.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d56caeed65c6e6e454668c715d0a63e4599634ca76b4c90726dcc6fdb12bdabb -size 4249600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_159.const b/unet/.cache/NhwcConv_0-conv_inConv_159.const deleted file mode 100644 index eb36abf636249b34db544fa5d2b0cc9ef744d26c..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_159.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_16.const b/unet/.cache/NhwcConv_0-conv_inConv_16.const deleted file mode 100644 index a37ad7d3f734d9c09d8fc285cb0a4f541fdb8db7..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_16.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3b3154e6d64099d5033e3225fcdcf45aab34afc8117561d76aac6bc175c71018 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_160.const 
b/unet/.cache/NhwcConv_0-conv_inConv_160.const deleted file mode 100644 index 1f16ac49a493b6e504fda15693908780c1bad654..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_160.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:41e2101c0afd4487152ee58ff1a8473daeb0b7020d52d6436b87279f67aed461 -size 8458240 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_161.const b/unet/.cache/NhwcConv_0-conv_inConv_161.const deleted file mode 100644 index 5680cf04332700de015b06e7ce87d665ff53c5a1..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_161.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_162.const b/unet/.cache/NhwcConv_0-conv_inConv_162.const deleted file mode 100644 index f46303bd27468717fb53c7990c28f17b4ba75dcd..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_162.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f19289ade01e596e32d9feb66d040dfd24d616ce5684da8e2de7270904decfb4 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_163.const b/unet/.cache/NhwcConv_0-conv_inConv_163.const deleted file mode 100644 index 719ccd29c9c55ff770a59709d0bdb3146c357e77..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_163.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2fc35d49c44dc52eefae24e84709a036a07b66da23bb6ada75a7e966bc24fc1a -size 1003520 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_164.const b/unet/.cache/NhwcConv_0-conv_inConv_164.const deleted file mode 100644 index bc606c68dbc0009eb92bb1dc01deaac06e1e8868..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_164.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_165.const b/unet/.cache/NhwcConv_0-conv_inConv_165.const deleted file mode 100644 index 
c33bb0d2d9a8c140ab4e6862f81740a27ba931e8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_165.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:98e6036c0dfdb1be21de7431172cb89c38bbfdf7758ffd4e579f5526663afb6a -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_166.const b/unet/.cache/NhwcConv_0-conv_inConv_166.const deleted file mode 100644 index 8128723a243c2ac3f5ea7d89c02b5a43d13c02ce..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_166.const +++ /dev/null @@ -1,3 +0,0 @@ ->>>>>>>>>>>:>>6>>>>>O>>>>>>>>>}>f>>>>>V>>>>>>>>>>w>>>=>>>>>>>z>>>>>s>>>>>>>>>=>Z>>>>>>>>>R>>>>>>>>>>{>>>>;>>>>>>>>h>w>=>>>>>>>>>b>>>>>u>_>>>>>>j>B>>>>>>>>>>>}>>>>>>>>D>>>>>>>>>>>=>>z>>>>>d>>>>>>>>>>>>U>>>e>>>{>>>>>p>>>>>=>>>X>>>>e>>>>>>>>=>>>>j>>>>>9>e>>>z>|>>x>>=b>>>>>Y>>>0>>{>>>>>z>>S>N>>>>>>>}>>>>>o>>>k>u>>>>U>>>>>>>>>>>=>d>>>>>>>q>>>>>t>>>>H>>>>>>>>>>>>>Y>>>/>>>A>>>>>u>X>>P>>>>^>>>>>>2>>>2>>>>>>4>>>>>>>>>>>>>z>>\>r>>M>>>>Z>>>>= ->>=>>>>=g>>>>>>>>>T>>>>y>>>>>>>>>v>>2>x>>>>>>}>>>>>>r>>>>=>>>>>>>N>t>>>2>>>>>>>>>>>>>>>>G>}>2>>>>>o>k>>>r>k>>=>>>>~>>>v>>>>>h>>>v>>>>>N>>>>>>C>>>>M>~>>>>>>>>>>>>>>h>[>%>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>P>>>>>>2>>>g>>>@>>> >>>}>>>>>>>>>>o>>>Y>>>>r>>]>>>>>>>>>>>>w>t>>>>>>>>>>>>>>>=>>|>g>>>=V>}>>>>>W>>>>>>>>>_>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>H>t>>>>>>>>>{>>>>>>>>x>=>>>>>>>>=>>>>C>>>v>>>>>>>>>>>>>>>>>x>=>>>>>>>>>N>>>>>}>>>}>>>>>i>>>>w>>>>>>>=>>>~>>>>>d>>>>>>>>>^>1>>>>>>>>Q>R>>U>>>+>>>>^>>o>>>>>>{>>>>>>>>>>>>>>>>>>>>>>>>>p>x>>>>>>>>>W>>>>>>o>>/>>>>>>>w>>>>>>>>>>>>9>>>>>>>>>{>>>>$>>>>>>>>>U>>%>>>>>/>>>>>>N>>>>>>>>>>>>>>>>#>{>>>n>?>>>v>>>>>>>>>>>>>v>U>>>o>>e>> 
>>>>>>>>>3>>>O>>>>7>>7>>>>>>>>>>>>>>G>>>>>C>>>>>>^>>>>t>>>>>>>>t>w>A>>>>>>>>>>~>>E>>>H>>>~>9>>>>>>>>>>>>>R>>>n>~>>>>f>>y>>>>>>>>>>>>>o>>y>>>i>>>Q>>>>>>>>>>>">>{>>>>>>>>>>>>i>>>>>>>S>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>(>>>}>>b>>>>>>>>>>>>>>>>>>>>>>_>>>=>>>>>>>O>>>>>>>>>>>>x>>M>=>>>>>>>>>>>>>>>>>>>>B>>>>>>>>>I>c>P>s>{>>>>>>>>>>m>>>>>>>~>>>>>3>>>>>m>>>>>1>>>>>>>>>t>>:>=>>>>>>>e>0>>>>>>>> ->>>>>>`>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_167.const b/unet/.cache/NhwcConv_0-conv_inConv_167.const deleted file mode 100644 index 88355555b13423596553f71c790d598dbc2ac966..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_167.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_168.const b/unet/.cache/NhwcConv_0-conv_inConv_168.const deleted file mode 100644 index cc192342e408fb87aa84137fe84ba64f42ee93ac..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_168.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:182590615728c427d62dc2cf6a90a90f7bbd5fd3eb9ea8d99abd8256bb8c4074 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_169.const b/unet/.cache/NhwcConv_0-conv_inConv_169.const deleted file mode 100644 index a83940a49ad5ff08c391577c51f65dc65749eb18..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_169.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e3477dd46c03ccefbe5fbd01830360a2a0a51ae117e9b1d9a3a6fd3574bf35d6 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_17.const b/unet/.cache/NhwcConv_0-conv_inConv_17.const deleted file mode 100644 index 883333ef11fd409f389592dac00d7bc6d500f989..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_17.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:f65a7223c99ce551a08d89beb42dca12d2372f9f1c3f5eccf80fe88da2e56b03 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_170.const b/unet/.cache/NhwcConv_0-conv_inConv_170.const deleted file mode 100644 index 216616c5e65f8ff09facb0d24d079f4c536313ec..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_170.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a81ad61c703ca7eb650ec5a12558f937b7f614744977e3ce188ce939284c86e3 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_171.const b/unet/.cache/NhwcConv_0-conv_inConv_171.const deleted file mode 100644 index 7b37edd3373468c6a8ae9decd4d406edd78f1026..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_171.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:349d06af53dcc2af8bca51904db4f143f71faed233f4ba0acebb6ec39ee92b90 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_172.const b/unet/.cache/NhwcConv_0-conv_inConv_172.const deleted file mode 100644 index ca18ffd1820a3616f4598b39492e371a18addd10..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_172.const +++ /dev/null @@ -1 +0,0 @@ 
->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>i>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>4>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>q>>>2>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>5>>>>>>*>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>5>>>>>>>>>>>>>x>>>>p>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>c>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>~>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>`>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>k>>>>>>>>>>>>>>>>o>>>>>>>>>>>>>>9>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>m>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>u>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_173.const b/unet/.cache/NhwcConv_0-conv_inConv_173.const deleted file mode 100644 index 708f365ed1778f46c9d3b38080101e1f28f193c0..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_173.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_174.const b/unet/.cache/NhwcConv_0-conv_inConv_174.const deleted file mode 100644 index 9b7f6a85807db697ec90987ebcb98e904333f60a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_174.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:82d6c288b2844a3096d68605ccfd3825132881db3b138e2b41fc68f6fbd20516 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_175.const b/unet/.cache/NhwcConv_0-conv_inConv_175.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_175.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_176.const b/unet/.cache/NhwcConv_0-conv_inConv_176.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_176.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_177.const b/unet/.cache/NhwcConv_0-conv_inConv_177.const deleted file mode 100644 index c1c7c94f37af14dfa42032309cabdae9252dc50e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_177.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5fe581bc225a0b0065d12a1b56034871734399aa51e91defe42a4b2503b6360e -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_178.const b/unet/.cache/NhwcConv_0-conv_inConv_178.const deleted file mode 100644 index 7b5ed0e6b2a7aa741a6885aa928135f92cf19353..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_178.const +++ /dev/null @@ -1 +0,0 @@ 
-a>]>\>f>_>a>a>Z>^>e>_>h>b>e>U>T>]>[>g>`>_>]>e>a>\>^>\>c>c>g>c>]>_>h>c>e>e>b>`>g>e>_>]>\>\>_>i>`>X>^>d>Y>a>\>a>h>Y>^>_>^>`>e>\>_>b>`>\>^>b>Y>d>_>g>a>b>h>e>b>_>f>b>c>b>^>a>f>c>d>d>f>b>l>b>d>b>_>\>^>d>`>b>X>a>a>c>b>_>\>^>_>]>b>_>`>e>c>f>`>]>h>]>e>]>d>c>V>k>e>d>]>e>`>b>T>Z>g>^>R>]>f>`>d>\>g>h>c>`>]>c>V>g>b>d>^>J>_>c>Y>b>b>b>]>i>a>_>f>l>^>Z>`>]>f>_>b>j>_>W>l>c>_>`>c>_>_>_>]>_>b>[>Z>>\>]>e>g>b>d>a>c>Y>b>]>b>a>\>\>z>_>\>a>c>`>^>f>h>c>V>_>[>Z>l>^>`>`>]>>>a>]>^>g>f>a>X>[>a>c>l>]>]>e>]>c>]>e>d>e>`>`>]>[>`>d>[>Z>d>]>c>h>e>b>]>`>Y>h>e>e>_>Z>\>[>e>b>a>[>b>X>b>f>\>k>_>_>c>c>]>c>`>b>^>\>a>[>c>e>^>a>^>[>b>e>b>h>Z>a>f>e>h>c>c>n>`>b>`>f>]>]>b>b>`>^>q>_>b>^>\>d>e>e>g>c>i>`>_>d>\>e>]>d>b>e>`>h>g>c>`>g>b>V>d>[>`>a>^>]>j>b>e>m>a>\>Y>c>d>e>d>P>S>c>=[>c>e>_>>[>]>`>d>^>d>`>`>R>c>`>`>[>]>_>\>Y>]>[>a>`>_>e>d>_>c>Z>d>d>_>g>b>\>d>a>[>`>l>d>[>a>U=`>f>]>`>d>#>l>[>a>g>]>c>a>_>`>`>\>_>c>]>e>a>\>\>]>]>d>j>b>h>[>a>_>W>_>]>`>`>`>a>`>p>c>X>_>g>_>`>a>c>]>`>]>g>g>X>h>b>]>Y>]>]>i>e>g>b>]>c>^>d>e>g>]>d>d>]>f>_>\>`>a>^>\>c>^>c>]>g>a>`>d>a>b>g>a>]>\>\>`>\>W>_>g>g>]>^>a>c>`>`>Z>[>a>]>h>c>`>`>^>i>b>b>_>_>^>h>Z>a>_>c>_>^>e>Z>e>c>b>d>^>\>Z>]>_>b>a>\>_>a>a>_>c>c>]>d>_>]>c>Y>Z>g>`>e>`>Y>U>f>_>S>Z>g>[>X>i>`>)>`>d>`>Z>b>_>]>^>d>y>_>a>e>e>`>^>E>f>\>Z>_>b>`>c>a>a>b>_>h>Y>`>e>h>g>a>]>^>f>Z>\>n>[>c>`>^>_>a>Z>b>\>_>a>_>a>f>h>h>^>_>b>i>[>g>b>\>i>`>_>a>]>_>\>^>f>e>c>e>^>k>_>\>d>a>k>g>W>c>_>[>^>^>_>^>l>e>]>b>_>m>`>]>i>a>c>f>X>Y>f>c>^>d>^>[>m>`>g>V>Z>b>m>[>`>b>Z>d>e>g>[>\>[>c>c>`>j>a>c>a>]>i>a>e>f>a>c>Z>a>`>`>^>e>_>[>a>e>^>\>_>a>a>]>X>e>a>Z>\>W>c>]>`>f>h>`>`>]>`>a>e>]>X>g>`>\>a>_>]>f>Z>d>a>c>a>c>Y>h>e>^>i>e>d>c>^>^>i>`>a>`>a>c>^>`>^>a>b>]>d>X>c>b>Z>e>b>g>X>b>_>f>a>e>Y>`>Y>a>g>^>Z>b>b>]>g>\>f>\>b>`>X>^>]>\>f>Z>c>b>_>Z>Y>W>a>Y>]>e>i>Z>f>g>Z>a>e>f>W>f>`>p>l>Z>c>X>d>_>`>Z>]>`>R>c>c>a>d>j>^>d>^>c>Z>`>Y>e>`>_>Z>`>g>d>`>T>Z>e>a>a>^>X>f>b>c>j>b>_>]>]>b>[>\>]>c>_>_>f>[>c>a>[>a>^>a>d>Z>_>`>Z>H>b>\>[>b>g>d>d>c>]>Z>b>e>f>e>a>c>b>\>a>^>d>_>]>d>`>f>c>^>]>`>_>^>e>Z>c>b>h>c>d>d>Z>c>f>h>a>b>b>Z>^>[>_>b>`>`>d>]>e>a>b>e>_>`>d>^>c>c>b>a>X>_>`>
^>X>g>c>_>`>d>`>c>]>^>c>d>^>`>[>]>c>^>b>k>c>c>e>_>d>[>f>c>_>a>Z>`>a>\>\>a>d>]>j>W>`>a>_>g>\>d>g>\>^>b>c>Z>f>^>Y>g>_>f>a>f>a>e>]>_>T>Y>c>Y>`>b>]>a>\>^>\>Z>]>c>g>^>f>X>c>]>c>^>c>c>X>c>a>Y>`>`>j>^>b>_>_>a>_>e>a>e>f>^>Z>k>`>\>c>P>_>g>a>j>c>]>`>j>]>[>e>a>d>h>[>a>`>i>W>g>g>d>c>_>U>h>^>a>`>d>f>b>^>b>\>_>\>b>_>`>`>\>h>`>_>e>Y>e>`>d>'>g>`>`>`>^>b>c>^>`>d>[>[>f>Z>X>a>a>d>l>]>c>h>b>c>W>`>d>c>e>Z>h>d>f>c>g>Z>c>d>`>]>Y>[>g>X>h>]>^>`>_>b>`>d>e>`>_>e>_>f>_>\>\>e>b>Z>d>a>a>Y>e>\>a>c>e>_>e>f>[>G>c>\>a>Y>Z>a>a>X>k>_>_>]>h>a>`>W>e>f>a>b>`>f>e>X>]>a>\>_>]>V>`>d>`>]>Z>a>_> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_179.const b/unet/.cache/NhwcConv_0-conv_inConv_179.const deleted file mode 100644 index 21944140aeaae55bc98d39d703bedeb54e9e5f11..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_179.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_18.const b/unet/.cache/NhwcConv_0-conv_inConv_18.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_18.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_180.const b/unet/.cache/NhwcConv_0-conv_inConv_180.const deleted file mode 100644 index 5f9cdb88128e1a53b25b8bc780be7e1fd5aec779..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_180.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2cf1f8016069c29c3779cffc776057793a14f8d861f372fe7de02d442db960f0 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_181.const b/unet/.cache/NhwcConv_0-conv_inConv_181.const deleted file mode 100644 index ad89151be9555c0e006331b1eb74ad10b734dfe5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_181.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:e257968fed2ff07f5a47f0247b113edc6ab277dc2258c98551b2bf567faa6f22 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_182.const b/unet/.cache/NhwcConv_0-conv_inConv_182.const deleted file mode 100644 index d623622c072045b828b397826ee4ee4a6b45a8e7..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_182.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6d4967339fcfb2b192acdd40bce66ddb1197d0b720eb29309dd589d5eb2b408d -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_183.const b/unet/.cache/NhwcConv_0-conv_inConv_183.const deleted file mode 100644 index 29d7efed7c686e107262751ea39a43a2a921da4e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_183.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9d91c011e49914dfb4cea5141ee94ce21d9b1e8230976b9a9f8e8c9e3a9120fe -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_184.const b/unet/.cache/NhwcConv_0-conv_inConv_184.const deleted file mode 100644 index 64bac5b4b5019f1db7f18d241090d158bab066de..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_184.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_185.const b/unet/.cache/NhwcConv_0-conv_inConv_185.const deleted file mode 100644 index 1e7d538bfa1b0472de0be0ac4a66c71dd5d535e4..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_185.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bb63ece2137b04e59f303cab93336af5f6f905b505ceb548b6788db7353931ad -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_186.const b/unet/.cache/NhwcConv_0-conv_inConv_186.const deleted file mode 100644 index 8acfd27ee988e4482213871a71eb3f633cdba024..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_186.const and /dev/null differ diff 
--git a/unet/.cache/NhwcConv_0-conv_inConv_187.const b/unet/.cache/NhwcConv_0-conv_inConv_187.const deleted file mode 100644 index e08f4707062453163b1cc380b13d170443e3c6b5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_187.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3286c863bb51b153397fc4521cd6dce0c340dbe2daa3837ec201e0b582347d23 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_188.const b/unet/.cache/NhwcConv_0-conv_inConv_188.const deleted file mode 100644 index 4557c62454b5cf1729ea9ef701130be4608ad436..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_188.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_189.const b/unet/.cache/NhwcConv_0-conv_inConv_189.const deleted file mode 100644 index 5015e265e7510b8ffe5adaccb3f19c8c1e992b60..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_189.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7338af3fcef195bb09d7ba134901c2dc6afb3b9aa1746ba39db94ccf7b9eddab -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_19.const b/unet/.cache/NhwcConv_0-conv_inConv_19.const deleted file mode 100644 index 022672cff1dc0365055e95553c0deadfd03d73ca..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_19.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2d25a76b7e747f7206cc546133c04b3bf89a3f77dc9f03e28f91b82400d403fc -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_190.const b/unet/.cache/NhwcConv_0-conv_inConv_190.const deleted file mode 100644 index e34be41dc0a2875b47346d2b2c6d1c916df54d51..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_190.const +++ /dev/null @@ -1,3 +0,0 @@ ->>>>>>>>>a>>>H>>>>>>>>>>>>>v>>>>>?>>>>>>>>>>>>> 
->>>>>>>>>>>>>>>>r>>>>>>>>>>^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>p>>>y>>>>>=K>>>>>>>>>>>>>>O>>>>r>w>>>>>>n>>>>>>p>>>>>>w>>>>=>>>>>>>>>>>>>>>>>|>>>>>>>>>>>=>>>>>>>p>>>>>>>o>>>>>>>>>>>>>>>>>>>>>>>U>>>>>>>>>>>>x>t>U>>>>>>>>>>p>>>>>>>>>>>->>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>X>>>>>>>>>>>>>>=>>>>>>>>j>>s>>>>i>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>`>>>>>>>>>>>>>>>>>>>S>>>>>>>>>>>>>>>>>>>}>>>%>>>>>>>d>>>>>>>>>W>>n>>>>>>>>>>>>>>}>>>>>>>>>>>>>>>>>>>>>>>>7>>>|>>>>>>>>>e>>:>>>>d>>>>>>I>>>>>>>>[>>>>>>>>>>>>>s>>>>>>>>>>>>>h>>>>>>>>>>>>>{>>>>>>>>|>>>>>>>>>>>>>>>>>>>>\>>>>>>>>>>>>>>>>>>>>@>>u>>>B>>>>s>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>{>>>>>>>>>>>>>>g>t>>>>>>>>>>>f>>>>>>>>>>|>>>>>w>>>>>>>>>>>>>>>O>>f>>>>r>>>>>>>>>>>>>>>>>>>>>>y>>>>>>>>>s>>>>>>>|>>}>>>>>r>>>|>>>>>>>e>>>>>>>>>>>}>>a>>s>F>>>>>>>>^>>>>>>>>>>>>>>>>h>>>I>>}>>>>>>|>>>c>>>~>>c>>>>>>>>>>>x>>>>A>>>>>>d>>>>L>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>(>>>>>>>]>>>>>>>>>>>>3>>>^>>{>>>>>>>>o>>i>>>>>{>>>>Q>x>>>>>>P>>>_>>>>>>>>>>>>>>>>>>>>>a>>>>>>>>>>>>f>>>>>>>>>>k>>>W>>>>>>>>>>>w>>v>>>>>>>>>>>o>n>>>>>>>>>>>>>~>>>>>>>>>>>>>>>>>?>>>>>>>>>>>>>>>>>>>>>>>>>>>}>>0>>>>>>>>>>>>>>>>>u>>>>>>>=>>>>q>=>>>>>>>>>>>>>>>>}>>>>>>>>>>>>>>>{>>w>>>>]>>>>>>>H>>>>>>d>>>>>z>>>>x>>>>>>>>>T>>>>>>>>>>>>>>>>>>>>>>>>>>>>x>e>>>>>>>>>>N>H>>>>>>>>>>>>>>>>>>>>>>>>>7>>>>>u>>>l>>>> ->>>>>>>>c>>>>>>>>>>>>>>>>>>>>>>>>>>>>p>>>>>>>>>>>>>R>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_191.const b/unet/.cache/NhwcConv_0-conv_inConv_191.const deleted file mode 100644 index 6bd418fe7f0793928697c84262c564c8f2128bf9..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_191.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_192.const b/unet/.cache/NhwcConv_0-conv_inConv_192.const deleted file mode 100644 index bc9ef81bb115510ce133a0dfca734f42e3255aca..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_192.const +++ /dev/null @@ -1,3 +0,0 @@ 
-version https://git-lfs.github.com/spec/v1 -oid sha256:365672e126a57c528c29d63a50c8800e9581f32dbdee64d152051d9891a53104 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_193.const b/unet/.cache/NhwcConv_0-conv_inConv_193.const deleted file mode 100644 index 2a9ffa1ff17a0b0d3f7c076e88b733db2a3be165..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_193.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a4a8ad4c26ec6cc11ba9b321b436b760d0bcbc89f51d0ca48208c8259da64cea -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_194.const b/unet/.cache/NhwcConv_0-conv_inConv_194.const deleted file mode 100644 index 37336c93a7ae9899c237b1891f7c8e0194bd33ec..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_194.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8c0bbcef4f7bc2d211e42d21470f7bb34236afdffc3bae6eceac2d68797a8978 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_195.const b/unet/.cache/NhwcConv_0-conv_inConv_195.const deleted file mode 100644 index a05953627f130591ae93cd3e732f37dcf4c6c6b1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_195.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c130884509c9ec008a12b2a0add402fec5bbfe0652022ed1c76718560b338ddf -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_196.const b/unet/.cache/NhwcConv_0-conv_inConv_196.const deleted file mode 100644 index 844c6a8f8311efeb56a86ce4ec358ae43c2acc91..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_196.const +++ /dev/null @@ -1 +0,0 @@ 
->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>{>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>P>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>a>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_197.const b/unet/.cache/NhwcConv_0-conv_inConv_197.const deleted file mode 100644 index be03cda2602f7e924c76e0d34f56a3e96517efda..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_197.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_198.const b/unet/.cache/NhwcConv_0-conv_inConv_198.const deleted file mode 100644 index fd59f42edf7bbd34e7344ba61091f0952c3280f1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_198.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:dabba40debec6fa18b0556f670ceb8cf6428a0ebf4cf842cd530d54dfa432611 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_199.const b/unet/.cache/NhwcConv_0-conv_inConv_199.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_199.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_2.const b/unet/.cache/NhwcConv_0-conv_inConv_2.const deleted file mode 100644 index 70878de9aa2f5f333dfc85911d7b04f96d5790ee..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_2.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_20.const b/unet/.cache/NhwcConv_0-conv_inConv_20.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_20.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_200.const b/unet/.cache/NhwcConv_0-conv_inConv_200.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_200.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_201.const b/unet/.cache/NhwcConv_0-conv_inConv_201.const deleted file mode 100644 index d6e40f3ef0d1654dab5400bc60e47799cdfa40b1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_201.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1b2d0ecce7160d05d63242a6f4cf12270be2caab568538a41d665f65746bc3e7 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_202.const b/unet/.cache/NhwcConv_0-conv_inConv_202.const deleted file mode 100644 index 30b9a148456f38a87cc348064c1014fd426a1879..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_202.const +++ /dev/null @@ 
-1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>R>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>w>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>;=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>~>>>>>>>>>>>>>>>>>>>>>>>M>>>>>>>>>>>>_>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>#>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>l>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>s>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_203.const b/unet/.cache/NhwcConv_0-conv_inConv_203.const deleted file mode 100644 index 4803179baa23d6803fc2993b10ec5163871f3f19..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_203.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_204.const b/unet/.cache/NhwcConv_0-conv_inConv_204.const deleted file mode 100644 index 97fc97624b592ac6f231a2d4fde7543693060dbc..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_204.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:6b17db01f2b7898b62b4034d92f96587beccbaf4643c2b26f8368a310afbee04 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_205.const b/unet/.cache/NhwcConv_0-conv_inConv_205.const deleted file mode 100644 index a6b13171a8030a5c59c535a0dc9d7ba718e0edfd..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_205.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:310d5b14b7c0fc679c9d1f0b07a0770751b53870b0115dd6b322328e65f8c59d -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_206.const b/unet/.cache/NhwcConv_0-conv_inConv_206.const deleted file mode 100644 index 692970fba25f88d063e372e3ea73c3118edf2176..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_206.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7f9a151a86eb7c178144ab20dbf67cf1c95a5081e8c8a039ce3cdb35465299a6 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_207.const b/unet/.cache/NhwcConv_0-conv_inConv_207.const deleted file mode 100644 index f59945cc092d4d13f20bc4c8a0995a5e8ff691d1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_207.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7109bf33abf0bac180b8785ac4a0ceb021da70cc8ebd12d8afe68ffe7d6d2842 -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_208.const b/unet/.cache/NhwcConv_0-conv_inConv_208.const deleted file mode 100644 index 5187a83359b6b305d3bd2434560ad2cb42f96575..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_208.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:02f6a4221674475118319fea4d0dd38124042e27d30205424ae4fb067f006ef3 -size 17244160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_209.const b/unet/.cache/NhwcConv_0-conv_inConv_209.const deleted file mode 100644 index 
8bc806e85599fc62b636e76c0f5b59f39af04886..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_209.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_21.const b/unet/.cache/NhwcConv_0-conv_inConv_21.const deleted file mode 100644 index 7a116e90c24ecf7445d1f41d8fb3579934851756..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_21.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c0a69a7d164351c913407f0537b99f7f35bf6ad8993fd71fc07cfb333b4b55a8 -size 467200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_210.const b/unet/.cache/NhwcConv_0-conv_inConv_210.const deleted file mode 100644 index d9fe8505c31f651d958581eb84f4f187e99efbb1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_210.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b7717b2f91d77ddde2bc58d07e0abde635ca744cd044e68ff071a9e5af22a309 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_211.const b/unet/.cache/NhwcConv_0-conv_inConv_211.const deleted file mode 100644 index 66981f91d246de1d837e76380a836452e103ae28..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_211.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_212.const b/unet/.cache/NhwcConv_0-conv_inConv_212.const deleted file mode 100644 index b553023c8ca8606db9b1922ace03942f81d5df60..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_212.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:150b176c085685060c4671eba153c29655af2e17a749351e3c1c333d7e0138c5 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_213.const b/unet/.cache/NhwcConv_0-conv_inConv_213.const deleted file mode 100644 index 82863e57f1d17e92feac3262d6bb4a0bfe57daaf..0000000000000000000000000000000000000000 Binary files 
a/unet/.cache/NhwcConv_0-conv_inConv_213.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_214.const b/unet/.cache/NhwcConv_0-conv_inConv_214.const deleted file mode 100644 index 5e2984a837669bca8835e689deebbc69745a9a8e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_214.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:64dc599aed0d949f0d4d153546d8906102849998ad88bed40ee7d3316dca0a78 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_215.const b/unet/.cache/NhwcConv_0-conv_inConv_215.const deleted file mode 100644 index e2161cb390a5f16bd382a8ff4431bc27d166047f..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_215.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_216.const b/unet/.cache/NhwcConv_0-conv_inConv_216.const deleted file mode 100644 index adca8661473306c35aef117dcb851737bfc8acda..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_216.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e808a24b9bcce1de038adbc6aefbf22573158aeba1bc16c26ccdb3303661b00a -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_217.const b/unet/.cache/NhwcConv_0-conv_inConv_217.const deleted file mode 100644 index e35babc5bdd06b1afb5dfc38f7d61860c050bc6e..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_217.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_218.const b/unet/.cache/NhwcConv_0-conv_inConv_218.const deleted file mode 100644 index da59fc8d19a0d4713a32756ed12add5c41afd021..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_218.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e58868b590a8460d0baafb8e1bc6b989ba630cf61175414df0b8d64ba11c46a -size 16916480 diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_219.const b/unet/.cache/NhwcConv_0-conv_inConv_219.const deleted file mode 100644 index 2859db744dc79f463ce400c5efa291896314a09d..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_219.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_22.const b/unet/.cache/NhwcConv_0-conv_inConv_22.const deleted file mode 100644 index be50c9674a4ebbcc717ae0926bc48fc805a7a752..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_22.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f4c72c04a7db25d2fc40ef3590c69225f755db192d86981bc14ae476ca994c36 -size 1077760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_220.const b/unet/.cache/NhwcConv_0-conv_inConv_220.const deleted file mode 100644 index 062efc2a3d0e1987960c5c9f2f4414fd2f23ff2a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_220.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1abc28eb46acec56bdc72bebe796865e2e5f4661ce9f6b54c03ee609eb0cc732 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_221.const b/unet/.cache/NhwcConv_0-conv_inConv_221.const deleted file mode 100644 index 9c6ca02950c939c415eec066c3a59b62b603c83c..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_221.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_222.const b/unet/.cache/NhwcConv_0-conv_inConv_222.const deleted file mode 100644 index e827930f862e2c3e1200d2227116c5e2eff42a74..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_222.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cee4a0e331ed8c7443fe2afe0de8bd9f49a0039f139d78d9e0f37ede28211deb -size 2048000 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_223.const b/unet/.cache/NhwcConv_0-conv_inConv_223.const 
deleted file mode 100644 index 0240d7a4db1545155f717bcca1060acf344960bf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_223.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>y>e>x>>>>>>>|>>=>>>>>>|>>>>>o>L>>>>>\>>>>>>>>>>>c>T>>z>>{>>>v>>>w>>>>>>>>>n>>>>>>>y>>b>>>S>>T>~>>>>}>>>>y>>f>>>>>>>>=>>>\>>>>>h>>>r>>>d>V>>>>>>>>>>>x>>>>_>>~>>>>z>>>>>>|>>t>>>q>>>>>>>>+>>>>>|>j>>p>>>>>3>>s>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>k>>v>>>>>>>>>>>>>>>>>>Z>>>>>>>>>>s>>>>>>>>>>>>>>>>>j>>>>>>>>>>>>c>>>>>>>>>`>>>>|>>>F>>>>>v>>9>>>>>u>>>>>R>>>>>>>>>S>>>>>>>g>>>W>>>>>>>>>:>>>>>>>>>>>>>>>>>>|>w>>>L>>>f>l>>|>>>>}>>>>>>>>>>>>>>i>>>>>>>>>v>>>>>>>>>>>>v>>>>>>>>>>>>>>>p>>>>>>>>>>S>>>>>y>Z>>>>>>>v>{>>>r>>>>y>>?>S>>>S>>>y>>>>>>>=>>>>>n>>>>>>>>>>>>}>>>>>>>>}>>>_>>>y>>>>l>>>>>>>>>>Z>>>j>>>>>>>H>>>>[>k>>>>>>>>>>>>>>>>i>>>>>>>>>>t>>>>n>>>>>>>Z>>>w>>>>>>>>>>>>>>>>>>>>Y>>>>>>>>>>>>>>>y>>{>>>>>>>>>i>>>>>q>>>S>>>>>>>>>>>>>>>Q>>h>>j>>>>}>>>>>x>P>>>>>>>>>>>>>>>>>>>>z>>>>>a>>>">>t>>>>>>>>>>>t>>>>>>>>t>>b>>>>d>>>>=~>>e>>>>m>w>>>>>>>>>>>>~>>>>>>>>>>y>>>l>>k>w>>>>>>>>>>>5>|>g>x>>>>>>v>>>>>D>p>i>>=>>>>>>>>>>>>>c>>>>>>>>>|>>>>>|>>>>->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>R>>>>>>>>G>>>>>>}>u>r>>>t>>>>>>>>>>>j>>\>>>>>>>b>>>>>>>>p>>>>>>>>R>>>>>>>>>>>>Y>z>>>>>z>>}>>>>>>b>}>>>>>K>r>>>>>>>\>>r>n>>a>j>>>>>O>>>>><>O>>>e>>E>>>>>>s>p>>>>x>>E>m>u>>>>>u>>>o>>>>>>>>>>>>>>e>o>>>>>>>>~>>>>>>>>>M>>>q>>>>^>>>t>>>a>=>j>>>>>>>>>>>>>>>>>Y>>z>k>>>>>>>>t>{>w>>>y>>>>b>>^>>>>>>>>k>>>>>>>>>>>>>>>>>v>>D>>x>>n>>={>>>>>>>>>>>>>>>>>>>>s>>>>u>>>>>>>>>>>Q>>>>>>X>w>>>> >i>>>>>>>>l>t>>>>>>>>>>>>>>o>>>>>>e>>+>>>u>y>>>>p>>>>{>)>>>}>s>>>n>>>>%>>>r>>>U>>>>>>>>A>B>>>>k>k>>>>>>>>>>>h>c>>>>i>>>>>>>>>>>>>>>>>>]>>>>X>>v>>>>>>>>>>>>>>>>>>>h>>>>h>>>>>>>z>>z>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_224.const b/unet/.cache/NhwcConv_0-conv_inConv_224.const deleted file mode 100644 index 0240f761083ee21cbdc9ae4423fef8f13af5ed11..0000000000000000000000000000000000000000 Binary files 
a/unet/.cache/NhwcConv_0-conv_inConv_224.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_225.const b/unet/.cache/NhwcConv_0-conv_inConv_225.const deleted file mode 100644 index 8c0b14a251335bb958245589fb2aa192465391f0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_225.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:257c4b9c75e6a2c665232a742d894a0210ac911d455a4f0008a04b480bf9a611 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_226.const b/unet/.cache/NhwcConv_0-conv_inConv_226.const deleted file mode 100644 index 394923b0801e29efe028f7bbe90e7927b8ba68e6..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_226.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:49329a9d9647e00ed031c58a123b87eb41ba1d50011d0ca92019375a2e0393c7 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_227.const b/unet/.cache/NhwcConv_0-conv_inConv_227.const deleted file mode 100644 index 7bf9e308889dd430792ce1dc0ad7593b0150f9ca..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_227.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f7f9a7b655ad445d6dabc49866356c83d52db539f44e2d32b65a88439ff7c49b -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_228.const b/unet/.cache/NhwcConv_0-conv_inConv_228.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_228.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_229.const b/unet/.cache/NhwcConv_0-conv_inConv_229.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_229.const and /dev/null differ diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_23.const b/unet/.cache/NhwcConv_0-conv_inConv_23.const deleted file mode 100644 index 17cde4d6baaffa15e6a16c9217db70cf0c0e97b8..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_23.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_230.const b/unet/.cache/NhwcConv_0-conv_inConv_230.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_230.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_231.const b/unet/.cache/NhwcConv_0-conv_inConv_231.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_231.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_232.const b/unet/.cache/NhwcConv_0-conv_inConv_232.const deleted file mode 100644 index 9a4efdba6e2adf24788826f2a0709396b3cde55f..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_232.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f8b0260d31b85b16ab9825a97b3de188bf39f5ae11faac8441973750095586a8 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_233.const b/unet/.cache/NhwcConv_0-conv_inConv_233.const deleted file mode 100644 index a717933c020512f2e70ecf95e8fa7f122ad774e3..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_233.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_234.const b/unet/.cache/NhwcConv_0-conv_inConv_234.const deleted file mode 100644 index 650cd01b3abf741a939128eb9aa59db330d2b2b3..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_234.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_235.const 
b/unet/.cache/NhwcConv_0-conv_inConv_235.const deleted file mode 100644 index 9a5a2218314ef501906d81efca966f6b979a05d1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_235.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:41da0d24ad227a48519c4dab4a1ce8d54ba3008422cc291b44029287c0b2468c -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_236.const b/unet/.cache/NhwcConv_0-conv_inConv_236.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_236.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_237.const b/unet/.cache/NhwcConv_0-conv_inConv_237.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_237.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_238.const b/unet/.cache/NhwcConv_0-conv_inConv_238.const deleted file mode 100644 index eb3a0010ec33395bf0b1538514718bd78ad7f630..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_238.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a0c8f954f60fb9cd7361147932cbda67a86fe2a630ca10bcae6b191650927f6a -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_239.const b/unet/.cache/NhwcConv_0-conv_inConv_239.const deleted file mode 100644 index ca010022e173b887cbdc5c5759cdd789e8509a2e..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_239.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_24.const b/unet/.cache/NhwcConv_0-conv_inConv_24.const deleted file mode 100644 index f20c52884e8e9c0089e5254028ea30f9240e487e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_24.const +++ /dev/null @@ 
-1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7a1eec0226383de9a8a6c73daf84bfc4257469ead557238a050b292f094523d2 -size 1077760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_240.const b/unet/.cache/NhwcConv_0-conv_inConv_240.const deleted file mode 100644 index 98b87a724446bd3529c56b830b57abe88e96de12..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_240.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_241.const b/unet/.cache/NhwcConv_0-conv_inConv_241.const deleted file mode 100644 index bd5a42675ab8728f4a96a91aaf141655a23fbe2c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_241.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ce590ef7c6556ec88625040317bb8bee8dd1815047f80f0df0f6d4560305320c -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_242.const b/unet/.cache/NhwcConv_0-conv_inConv_242.const deleted file mode 100644 index a3c2ebb388b7fb7ce835f5d72ee21ac94ce702b2..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_242.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ff5c7546cbd2a62a1ce1bd84f6abf4dea359ee025e98aa4bb3a800748b5bd428 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_243.const b/unet/.cache/NhwcConv_0-conv_inConv_243.const deleted file mode 100644 index 58232ae86720f4ae0427d4263e7633a14c133b3b..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_243.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0a12208dd7584ce580c94d44e3afe8c776ca7749a7e4e70f404db3dd2f721437 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_244.const b/unet/.cache/NhwcConv_0-conv_inConv_244.const deleted file mode 100644 index af31a6ee8ba879535dd95192742ba14d9046a322..0000000000000000000000000000000000000000 --- 
a/unet/.cache/NhwcConv_0-conv_inConv_244.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c5b8a8792c62e87d3f68c2422e5324d28d5b0cc74548919bd6630f87d79947ed -size 2048000 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_245.const b/unet/.cache/NhwcConv_0-conv_inConv_245.const deleted file mode 100644 index 09f8f952d35e249328e9ad0597f7c6eb51f0a407..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_245.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_246.const b/unet/.cache/NhwcConv_0-conv_inConv_246.const deleted file mode 100644 index 748e18877996a1883c9798b45ea2e52fc478037d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_246.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5434a806d4c0ce45651b194bead5586b3695377ad82655be2605ee428ee24660 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_247.const b/unet/.cache/NhwcConv_0-conv_inConv_247.const deleted file mode 100644 index bd20f9b68fb01627db31b8f1bb277abceb7e4ac0..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_247.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_248.const b/unet/.cache/NhwcConv_0-conv_inConv_248.const deleted file mode 100644 index a52a968be82dfe4214f1550bf43444da4e6b33fc..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_248.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:27e0007f0ad3221e36766fa99c183ff3f2a34be1a055b624d37cb6ddf1fe6339 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_249.const b/unet/.cache/NhwcConv_0-conv_inConv_249.const deleted file mode 100644 index 7dcae43bf7e8385fc2669b0127c21aa23d836888..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_249.const and /dev/null differ diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_25.const b/unet/.cache/NhwcConv_0-conv_inConv_25.const deleted file mode 100644 index de842572f486c17d1f23b808d99d09e5a1c16d78..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_25.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_250.const b/unet/.cache/NhwcConv_0-conv_inConv_250.const deleted file mode 100644 index a169dd207f4d44b9b59c7193959bbfcde228699a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_250.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c8cdf8474190d8f3983640b51bef1f210006b42fbbbdfdf5c4e493d06a9e87b4 -size 33832960 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_251.const b/unet/.cache/NhwcConv_0-conv_inConv_251.const deleted file mode 100644 index df951dfcf2b692d97558d37ba77bfd2dc9535de9..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_251.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_252.const b/unet/.cache/NhwcConv_0-conv_inConv_252.const deleted file mode 100644 index 5419cd23bbaee95affec4cdc12f064c4b89a3dd1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_252.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4bc82f1334639e1de24ee01f2b83e44a6195ec6adbb5e6acb1e1afc7625a0afb -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_253.const b/unet/.cache/NhwcConv_0-conv_inConv_253.const deleted file mode 100644 index 238befd58ecade5f136348355c7b23c1a6d8bd59..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_253.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d29931783ca87b829f7601b4f8bb47a9da242b225efc637356532a00945163d2 -size 4096000 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_254.const b/unet/.cache/NhwcConv_0-conv_inConv_254.const 
deleted file mode 100644 index 4ba0cda535e0fe5c554f4835f76aa4fd131fae1f..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_254.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_255.const b/unet/.cache/NhwcConv_0-conv_inConv_255.const deleted file mode 100644 index 55b1438e23a61f5f9eeb6d3668c200dfe3a33d29..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_255.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a06f15282a2abd796916eac42e75878bf9dcbc226d7497fbf3f46100caf9ca52 -size 33832960 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_256.const b/unet/.cache/NhwcConv_0-conv_inConv_256.const deleted file mode 100644 index c5e6e96ac929b9bf6b7c7e6973c372610e40eaf5..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_256.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_257.const b/unet/.cache/NhwcConv_0-conv_inConv_257.const deleted file mode 100644 index 00e592869f2e9d3e396e078abb3dc422868a48f7..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_257.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b09e0c4c107aaab8c1ffc0ae6d90a59157192f330fccb61c0fe6b95a8243a7bb -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_258.const b/unet/.cache/NhwcConv_0-conv_inConv_258.const deleted file mode 100644 index a1cdc3222f014b116aa43574ef0acaf92d879101..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_258.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e3d054706581c747cf7dc13c109b27b78655bf1ba2f9730e3b51203710b5a35 -size 4096000 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_259.const b/unet/.cache/NhwcConv_0-conv_inConv_259.const deleted file mode 100644 index 
aa19c28a9d65e00c2d685fe95663f4b2515791d0..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_259.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_26.const b/unet/.cache/NhwcConv_0-conv_inConv_26.const deleted file mode 100644 index 4898597046842bf9cea1ad2b4040c5ec6bc4f5d9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_26.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e88011f7d3c1a8623bcf5b361590040d8cb1f50d90fe643df8a46fe659bd0f4 -size 125440 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_260.const b/unet/.cache/NhwcConv_0-conv_inConv_260.const deleted file mode 100644 index 32600647aef5d107622f9a7e033f13ef35e60ea3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_260.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:32be16856de20eb0da921dfc4e34f74c30f05028a2d54398db40ab75c879b80a -size 33832960 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_261.const b/unet/.cache/NhwcConv_0-conv_inConv_261.const deleted file mode 100644 index 4f2845c05845e9711cf6cd66cbbe9708bbec8a19..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_261.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_262.const b/unet/.cache/NhwcConv_0-conv_inConv_262.const deleted file mode 100644 index b1a5d586aa4f4f6dc36f6657da85d3c8906618d9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_262.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b973a9741c4629e176545fd231a45580c6751da24f583665310f380370387cd1 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_263.const b/unet/.cache/NhwcConv_0-conv_inConv_263.const deleted file mode 100644 index 5c0951d974b24c9c7913f14773b02c946aadd174..0000000000000000000000000000000000000000 --- 
a/unet/.cache/NhwcConv_0-conv_inConv_263.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b27fcb75071198f9707e383b04b6cd03bed3af50053a7195c5b00a9d65538740 -size 4096000 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_264.const b/unet/.cache/NhwcConv_0-conv_inConv_264.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_264.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_265.const b/unet/.cache/NhwcConv_0-conv_inConv_265.const deleted file mode 100644 index bc384f2e3c4b25035c77b076ff8d73fb7261a05d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_265.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:50cb410d9d4d6ce6bf936958bb92784433158ef9bc41a2050404e3cae17a56cc -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_266.const b/unet/.cache/NhwcConv_0-conv_inConv_266.const deleted file mode 100644 index b8577c98ff911a0d415ceb31f2854203bb1b48d1..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_266.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_267.const b/unet/.cache/NhwcConv_0-conv_inConv_267.const deleted file mode 100644 index be381384fb0c3d2cadc442b58358e816779e8656..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_267.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e0194912b35412cd30fd4945bc348f0d5e1b60555db0a7f0ad115f561ec3fe8 -size 33832960 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_268.const b/unet/.cache/NhwcConv_0-conv_inConv_268.const deleted file mode 100644 index a32722a81329c6d720521e61613630563da0c0ff..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_268.const and /dev/null differ diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_269.const b/unet/.cache/NhwcConv_0-conv_inConv_269.const deleted file mode 100644 index f20b60f0674eb51d66f520f9e96c0149511d55c2..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_269.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:229627597893f0cedce4f34ec3263b7687e3407f86e0a48a8fb9be31eac09a56 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_27.const b/unet/.cache/NhwcConv_0-conv_inConv_27.const deleted file mode 100644 index db2054f0c682ddce19071543e97292e32d9db41b..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_27.const +++ /dev/null @@ -1,4 +0,0 @@ ->??9???>?>=?@? ?3??2?6?D?>>P?,?>6?>0?>-????.?(??%?&?>7?>1?>?0?>? ?>&?>??>>!???>Y??#???>?*?>9?>-?I??C??@???:??>>(?G?/?'?>?$??%?>@?>)?!?>>'?F??0?-???>-?0?>? ??*??0? ?>??#??? ?-?3?>??@??>%?7?-??;??0?>?G??G??4?&??>>??"? ?>?>$?0?A?:?4?N?#?%? ?H?>?#? -?7?>5?;?-?'?'?$??>>+???=??>>)?0? ? ?A?>>?>? -??6?.??? ? ?>>?>>>>#?!?4??*?'?>??>M?1?+? ?4?(??D?@?>.????????%?,?0?*??/?2?>Q??>@?)??C?0?$?)?>,?O??>D?,?>,? ?>>0?>?(??>A?>?*?;??>?>?"?>D?F?>&?/?)?8?4?/?'?$???.?9? 
\ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_270.const b/unet/.cache/NhwcConv_0-conv_inConv_270.const deleted file mode 100644 index a37fd01cc6dcf3aee9b175ce90d4d2925798eee6..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_270.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:487029c181659e230f68af0d807b7297140cf16dddf1e259d979c58ad6152009 -size 4014080 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_271.const b/unet/.cache/NhwcConv_0-conv_inConv_271.const deleted file mode 100644 index 49feff97bfb1bf8ba0572522975057a5c5ce6346..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_271.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_272.const b/unet/.cache/NhwcConv_0-conv_inConv_272.const deleted file mode 100644 index 7875b3795759eb84fe6a6951ad66ecedee4487d7..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_272.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e9f7e6ca4b837c0bf981eeb489653454501742ba29f7eff0dead7e9916b84c0d -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_273.const b/unet/.cache/NhwcConv_0-conv_inConv_273.const deleted file mode 100644 index e915c8a49af8fc703d7d43fd035f590a5b47afeb..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_273.const +++ /dev/null @@ -1 +0,0 @@ 
->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>8>>>>>>>>>>c>>>>>>>>>}>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>/>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>p>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>_>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>E>>>>>>>>>z>>>>>>>>>>>>>>>>>>>>>>>>>>>>N>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>j>>>>>>>$>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>v>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>`>>>>>>>>>>>>T>>>>>>>>>>>>>>>>>>>>>>>>>>>S>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>q>>>>>>>>>>>>>>>> >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>i>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>1>>>>>>>>>>>>>>>>>>>>>>>>>>=>>a>>>>>>>>>>>k>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>v>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>V>>>>>>>>>>>>z>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_274.const b/unet/.cache/NhwcConv_0-conv_inConv_274.const deleted file mode 100644 index 47856ae43c72823f391005fe05ead540f088d7dc..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_274.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_275.const b/unet/.cache/NhwcConv_0-conv_inConv_275.const deleted file mode 100644 index 1c87be8b83ef80e4602757cf40eb13e38ec7f45f..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_275.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:c97d813cd2cb28054162dc167ef543760953d513de1f1aa892681cf918cc9b35 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_276.const b/unet/.cache/NhwcConv_0-conv_inConv_276.const deleted file mode 100644 index 87c594fc45a4b99711b7db98e2708e7f4db23869..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_276.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f63353081ba9ccb540206e7ae77de43ad5af761cbfbffcd149d474ebbc279c89 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_277.const b/unet/.cache/NhwcConv_0-conv_inConv_277.const deleted file mode 100644 index 6c92ca0006da21569322a5b51887ec2b274236d3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_277.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0a3e0808b3e876259db857df9944abc2da818d3000cfe237fe59a4db035afd99 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_278.const b/unet/.cache/NhwcConv_0-conv_inConv_278.const deleted file mode 100644 index 199c7cc2ec9e652281a8da00ede4a66e4ba69296..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_278.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:35fc391c3648bb87b1a3bc0ff03ded46d19c92a53d72e7001f60fabee42d41e2 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_279.const b/unet/.cache/NhwcConv_0-conv_inConv_279.const deleted file mode 100644 index 117932fbf038ead32fdde946bee93be9de435201..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_279.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_28.const b/unet/.cache/NhwcConv_0-conv_inConv_28.const deleted file mode 100644 index 44fee57ec336db0b8cc19ce1ff11a3348ba03666..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_28.const and /dev/null differ diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_280.const b/unet/.cache/NhwcConv_0-conv_inConv_280.const deleted file mode 100644 index c6218a0b52d1d05dde0ab5062b6e7c39f275d781..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_280.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_281.const b/unet/.cache/NhwcConv_0-conv_inConv_281.const deleted file mode 100644 index ed8d06be91a9a5cf33dab78705e19c19b66fe6ef..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_281.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b1798c033e794e2beec32c69083d50d1a47836080f43d9e4fa7b409af66167b9 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_282.const b/unet/.cache/NhwcConv_0-conv_inConv_282.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_282.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_283.const b/unet/.cache/NhwcConv_0-conv_inConv_283.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_283.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_284.const b/unet/.cache/NhwcConv_0-conv_inConv_284.const deleted file mode 100644 index ebc397d918096dde68d43a0505cb29608983bb8c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_284.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5b2e8a6d44b6866a7673c64e763a99d777839b5aad6eaee8a6103b0f8903ad5b -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_285.const b/unet/.cache/NhwcConv_0-conv_inConv_285.const deleted file mode 100644 index 3a14cc8983ac43f1e567a744ee137ea350b2c1d4..0000000000000000000000000000000000000000 --- 
a/unet/.cache/NhwcConv_0-conv_inConv_285.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>J>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>e>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>N>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>@>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_286.const b/unet/.cache/NhwcConv_0-conv_inConv_286.const deleted file mode 100644 index c5cc4bc1f0632a3acf2d16d5afb7efb47fd9b4a3..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_286.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_287.const b/unet/.cache/NhwcConv_0-conv_inConv_287.const deleted file mode 100644 index f43640b1adf2375f782a4c724e522bb9e52ea95e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_287.const +++ /dev/null @@ -1,3 +0,0 @@ -version 
https://git-lfs.github.com/spec/v1 -oid sha256:73bc8699f11d7f18a33f44e74372d157e9e747e18039091f1582e71d4011bcd2 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_288.const b/unet/.cache/NhwcConv_0-conv_inConv_288.const deleted file mode 100644 index c76b54d81572db33cd1b25dcb9cae3fd94734a5c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_288.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3adfdae670cec91a3ebf994a89a14936b696e7b85aa5ddd8fbeae7040cfddfe2 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_289.const b/unet/.cache/NhwcConv_0-conv_inConv_289.const deleted file mode 100644 index ba69164bcd0482102479dc1befe1c60d83a454a0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_289.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4286051d79b3153f549bda71fd1e05cc9c293514000a425a719f6e204e4cd94b -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_29.const b/unet/.cache/NhwcConv_0-conv_inConv_29.const deleted file mode 100644 index 659ada2b0f5a1935192505e7fc40bb2d35143863..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_29.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:63f7d4415e2ecee861e5ce149d2f36ebc6e5b5455373e46269a559dccaca5c87 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_290.const b/unet/.cache/NhwcConv_0-conv_inConv_290.const deleted file mode 100644 index 820d8dd6cf82489594806f3b60c395a543a54ccf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_290.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:49563a6271355cc9b6b004d704859ea7d14ab2c1a9b0e4e5195f62622e65cd5d -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_291.const b/unet/.cache/NhwcConv_0-conv_inConv_291.const deleted file mode 100644 index 
f1552bd86b4010909daf5d15dbd65a5ccdef9621..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_291.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_292.const b/unet/.cache/NhwcConv_0-conv_inConv_292.const deleted file mode 100644 index 4b52f83edce36d416b89c82199c92ea74374334e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_292.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:314866d6aa86932e1665f4643a35101de127b545dca6eb2bb6bd4cba32b92010 -size 33832960 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_293.const b/unet/.cache/NhwcConv_0-conv_inConv_293.const deleted file mode 100644 index f72ac3d4869e27b1983c19714eac7636a18ab4da..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_293.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_294.const b/unet/.cache/NhwcConv_0-conv_inConv_294.const deleted file mode 100644 index 1ab928eaa3a08ff2763566112c15679884a045e1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_294.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:96d3ce9059004f228c4158b361bc1bc73c8f8fed6c72d3e73b7363ff1ffcd2a1 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_295.const b/unet/.cache/NhwcConv_0-conv_inConv_295.const deleted file mode 100644 index b0f9e60647f979e33c2218c1158824b75bd0e33e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_295.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7c21f75c5c7413d4a5096822d1f9c836d3a770d18bf85eb6a94092299c032988 -size 4014080 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_296.const b/unet/.cache/NhwcConv_0-conv_inConv_296.const deleted file mode 100644 index 092fd3008fd1a598ad0b3dba08b520edc3938e77..0000000000000000000000000000000000000000 Binary 
files a/unet/.cache/NhwcConv_0-conv_inConv_296.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_297.const b/unet/.cache/NhwcConv_0-conv_inConv_297.const deleted file mode 100644 index 91a07a89a398b031f53dc8f95b07fad8d8320aa5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_297.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:33e8f5dd0bb0310d779fc5d52b40f48eb9ef3bdd41dbbf9e2c72e62e70fff2c9 -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_298.const b/unet/.cache/NhwcConv_0-conv_inConv_298.const deleted file mode 100644 index be6715b45d7da9c78c64b657ce7dc6a19cb6caff..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_298.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>=>>>*>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>d>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>M>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>6>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>a>>>>>>>>>>>>>>>>>>>>>>>>>>>>>/>>6>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>}>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>u>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>m>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>i>>>>>>>>>>>>>>>>>>>>>>>>>>8>
>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_299.const b/unet/.cache/NhwcConv_0-conv_inConv_299.const deleted file mode 100644 index 45a6eaf59eac7ebf9ce225218fc040061772d72a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_299.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_3.const b/unet/.cache/NhwcConv_0-conv_inConv_3.const deleted file mode 100644 index 903b7383354b3b641c526f2ad06586c1c21e2c4a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_3.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f538f981bd0db466140a14207d18ae4a42ee7738a95ec30c57c778b760c596db -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_30.const b/unet/.cache/NhwcConv_0-conv_inConv_30.const deleted file mode 100644 index 0c3cc351a3be351d5b36a15b5b1c8a042cc9c07c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_30.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3c5ac06faf0f9a95ad2cce8a8ee6434e8272c3ae3620c22a2bb736f88bbaa551 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_300.const b/unet/.cache/NhwcConv_0-conv_inConv_300.const deleted file mode 100644 index a1789f8d2091b1c0525b8c74a6a359544612c2ed..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_300.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:969aaba1b10358dd53e33779f03b8969ff06f9784483a6ce5167f776c48ec96c -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_301.const b/unet/.cache/NhwcConv_0-conv_inConv_301.const deleted file mode 100644 index b4e20a136b9a1a75f318359fe39fea82b14ffeea..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_301.const +++ 
/dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:714bd88299a39e75cf124a08783e0c6c7a1a93bcbe32513ede2f4dada37beef9 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_302.const b/unet/.cache/NhwcConv_0-conv_inConv_302.const deleted file mode 100644 index a85a9d07823fe2b072d2dd673d7f71a4eb6a34ea..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_302.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:15ffca060de24b3c6cdff75e9d6160cbe5bfc57313a079bbbbf2feae7fe32a93 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_303.const b/unet/.cache/NhwcConv_0-conv_inConv_303.const deleted file mode 100644 index 3016416808d9edc8e1d084b0a6707a779e5d1abf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_303.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:667af7a898de53c915714c9ed22547800076bbc6d2216309d7e201c94a6eb60c -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_304.const b/unet/.cache/NhwcConv_0-conv_inConv_304.const deleted file mode 100644 index a1957236dd9bce57c98c74b7e4682a6099f80053..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_304.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_305.const b/unet/.cache/NhwcConv_0-conv_inConv_305.const deleted file mode 100644 index dbde20b0a7551284a987a761876a327aaebe0b67..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_305.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_306.const b/unet/.cache/NhwcConv_0-conv_inConv_306.const deleted file mode 100644 index 44a94cb087f46ebae7c9270b6833e7f2468d9ae0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_306.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:def4a65e2719da256a4cb047f8fca1c70f5cc6c7bf94d9c920e6b5127eff3818 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_307.const b/unet/.cache/NhwcConv_0-conv_inConv_307.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_307.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_308.const b/unet/.cache/NhwcConv_0-conv_inConv_308.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_308.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_309.const b/unet/.cache/NhwcConv_0-conv_inConv_309.const deleted file mode 100644 index 1912df5640f577d1d76eb861836f6f94ca7b2168..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_309.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:60434fc4d97232f9af18ec9f5a1e100fcc592d16bf34879bc3bf94942840fe77 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_31.const b/unet/.cache/NhwcConv_0-conv_inConv_31.const deleted file mode 100644 index bd2fbbd5560ffa943cf53a177ff77983ed841ecf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_31.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:542427be7b5e666a10a01928c7a3b1676b7546e0a02b377b13c9b49f7a6368a3 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_310.const b/unet/.cache/NhwcConv_0-conv_inConv_310.const deleted file mode 100644 index 48b4bd6f4b68d47ef59da4adaae520143088747a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_310.const +++ /dev/null @@ -1 +0,0 @@ 
->>>>>>>>>>>>>=>>>w>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>f>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>r>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_311.const b/unet/.cache/NhwcConv_0-conv_inConv_311.const deleted file mode 100644 index 88c0a1fc1eee7cd43b176362a353a67ad6268b59..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_311.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_312.const b/unet/.cache/NhwcConv_0-conv_inConv_312.const deleted file mode 100644 index b5c77bfc1d54a34374cd7464072fec689da986c6..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_312.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:f50e3429fb0cb192a5e92cba327c21092f26d69b4634aebc639b0e76c7ae5df8 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_313.const b/unet/.cache/NhwcConv_0-conv_inConv_313.const deleted file mode 100644 index 28de21d3349103516cb1cdf91ceff30f44f65fdc..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_313.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6eb88d4a514a41e9ab84cfc1e5b89eba86b30b077853fd66795eddc9185506db -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_314.const b/unet/.cache/NhwcConv_0-conv_inConv_314.const deleted file mode 100644 index af8f800f9a31ef74ed3a2b77daa3b2d00e3d93cf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_314.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c308efa8752b60a1f9ab5b8ebb84adb8f1c9085e654a7e4a1a077c60effebb94 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_315.const b/unet/.cache/NhwcConv_0-conv_inConv_315.const deleted file mode 100644 index 7d7bc98ea440d621fc861cf1b12035d638acaa58..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_315.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:26f231b20b08a5c3b2275ecc1deec44b163ee057efcbb2429e24bb2024a69174 -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_316.const b/unet/.cache/NhwcConv_0-conv_inConv_316.const deleted file mode 100644 index 81a8b94d7f83d44a0408a76ebf4d78d06b0cf37b..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_316.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_317.const b/unet/.cache/NhwcConv_0-conv_inConv_317.const deleted file mode 100644 index 7cc55861b0c460cf1696c052fb1f115f8dbb1c6a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_317.const +++ /dev/null @@ -1,3 +0,0 @@ -version 
https://git-lfs.github.com/spec/v1 -oid sha256:bf5d9115785e2fe5caf9da1f6d44b96135a5907e01596ba04c1344e43700cfc3 -size 25374720 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_318.const b/unet/.cache/NhwcConv_0-conv_inConv_318.const deleted file mode 100644 index 88ecf4f79a56fcb2d917a968bea8c5838fd5b8f4..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_318.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_319.const b/unet/.cache/NhwcConv_0-conv_inConv_319.const deleted file mode 100644 index 4d07d5aa06116564318207b08354b52430c75c47..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_319.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2149fd9ed125d273cb509ccf316ae5d91cd52e745f2197c8c13a4107b5bbb282 -size 16916480 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_32.const b/unet/.cache/NhwcConv_0-conv_inConv_32.const deleted file mode 100644 index 8a03cdf97422c37ec4ca61c61ac4a4586adfbed9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_32.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e78840ef73708e6a5e017f193b7b2d1ba8f983cb03f96af51fa61e58f7703d9 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_320.const b/unet/.cache/NhwcConv_0-conv_inConv_320.const deleted file mode 100644 index f5ba7669a9f2d90655e5945beb776901346d6176..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_320.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4f53d196cc3ec2a979bdde36b3c5524c6a72800e80e74612e86ffa42358ff926 -size 3010560 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_321.const b/unet/.cache/NhwcConv_0-conv_inConv_321.const deleted file mode 100644 index 0a69fbf6392d8f32c75334b4fc78c05825ce55bf..0000000000000000000000000000000000000000 Binary files 
a/unet/.cache/NhwcConv_0-conv_inConv_321.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_322.const b/unet/.cache/NhwcConv_0-conv_inConv_322.const deleted file mode 100644 index f937ea1b7190d6bb21b35d863d160196dedb287e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_322.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:29fb85ab9da54b211a48a8eb4e9812aa8a046bcdbf8ce598c28b2ec62ac97c82 -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_323.const b/unet/.cache/NhwcConv_0-conv_inConv_323.const deleted file mode 100644 index f715a30cdaf7e75e9ff30b50e606a4512abf07f0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_323.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>y>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>e>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>}>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>8>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>?>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>^>>>=>>>>>>>>>>>>G>>>>>>>>>>>>>>>>>>>>>>>>
>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>v>>>>>>>>>>>>>>>>>>>e>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_324.const b/unet/.cache/NhwcConv_0-conv_inConv_324.const deleted file mode 100644 index 1d6e8622f5352ea995421a685c1677de6147b2c4..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_324.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_325.const b/unet/.cache/NhwcConv_0-conv_inConv_325.const deleted file mode 100644 index 183f9d9da602e1da35955c2b2bea774e5d4e0b4e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_325.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:89b24f519d2308e4b9e22fb40760588b7cb289216f51b60e75954a9aceaa2884 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_326.const b/unet/.cache/NhwcConv_0-conv_inConv_326.const deleted file mode 100644 index a183948ad5d6f4ef05a7c7966c5c6492657b6487..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_326.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5ee20a3aaac641664f8101f7f938a038ad14b3bca1ba3ed27567631a026b0a5f -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_327.const b/unet/.cache/NhwcConv_0-conv_inConv_327.const deleted file mode 100644 index 3c13d0911ddd654c6f0a9f4f50df33f997544ca1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_327.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6b8a2d4533b7e4a2e46eb06cb919f86a64f9bd580e542f1ad5f03a912ab5b844 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_328.const b/unet/.cache/NhwcConv_0-conv_inConv_328.const deleted file mode 100644 index 7b9f0264182d8cf487fd76295a2465e40ad1c7c1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_328.const +++ 
/dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:eedf41387edfa950ef225f7a20d435fb8fc6d0c7e817f6b2569202b5c7ac3bc4 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_329.const b/unet/.cache/NhwcConv_0-conv_inConv_329.const deleted file mode 100644 index 30ee4d14681ca52037eb9c662b1ca9c5ac05d1d7..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_329.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_33.const b/unet/.cache/NhwcConv_0-conv_inConv_33.const deleted file mode 100644 index 0f8eabea53368f61479ffd22b5b3e5c729ee1850..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_33.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_330.const b/unet/.cache/NhwcConv_0-conv_inConv_330.const deleted file mode 100644 index 055dbec58c20fc0006b360051327058b28000f46..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_330.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_331.const b/unet/.cache/NhwcConv_0-conv_inConv_331.const deleted file mode 100644 index f6e9de9e97cbce07894cb47dc703ebc9b2624162..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_331.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f161dda8d21ec33ed4988276ef243beee627bc8f6d7a6fdb0406ceba1e38cc3a -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_332.const b/unet/.cache/NhwcConv_0-conv_inConv_332.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_332.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_333.const b/unet/.cache/NhwcConv_0-conv_inConv_333.const deleted file mode 100644 index 
00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_333.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_334.const b/unet/.cache/NhwcConv_0-conv_inConv_334.const deleted file mode 100644 index d4393c485ce6972a7c4c3f7b9886a9a9b214f8e3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_334.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c52f5f1f5741daf9cb679fde7954cbfd7bda5b564966f9d748cbe0efc1606604 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_335.const b/unet/.cache/NhwcConv_0-conv_inConv_335.const deleted file mode 100644 index d12d6d3e4663e989610c432f4b4be0b997e06130..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_335.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>%>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_336.const b/unet/.cache/NhwcConv_0-conv_inConv_336.const deleted file mode 100644 index 5383f73bb4a8b080fea941a991e701ae80fca921..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_336.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_337.const b/unet/.cache/NhwcConv_0-conv_inConv_337.const deleted file mode 100644 index b29096abb3b42d7c63144ac6b92d259c2d251f53..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_337.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cd8e1749758760d97900c5ef9eb50c83a3c1ce6c01258ad41586a68a05fd1eef -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_338.const b/unet/.cache/NhwcConv_0-conv_inConv_338.const deleted file mode 100644 index f628f65b3e61005f8170943bf330f065285ba4fc..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_338.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:13a6dded82e3745e5124e78cb542b1353224d5078675b9c3e6cf6288332f7a00 -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_339.const b/unet/.cache/NhwcConv_0-conv_inConv_339.const deleted file mode 100644 index dc026d078089bc6f09921e3e30c5b22c1b4c188e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_339.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f9e1feb2f6a2f6be51d5bff78e636a06517f82286b3562ba5bb99f69e3925a7f -size 7475200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_34.const b/unet/.cache/NhwcConv_0-conv_inConv_34.const deleted file mode 100644 index 
ef26ac79019e5f601de6262a0ffb8440282c525b..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_34.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_340.const b/unet/.cache/NhwcConv_0-conv_inConv_340.const deleted file mode 100644 index ded3d38ec5af50ab1158936c91df86ea0504b1e3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_340.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e52a90266558d587b186274ed601ebbfb834febd93c9f5b246876aaa603240ff -size 2007040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_341.const b/unet/.cache/NhwcConv_0-conv_inConv_341.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_341.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_342.const b/unet/.cache/NhwcConv_0-conv_inConv_342.const deleted file mode 100644 index 55657d1dfd96732a8e710a3265baedb2c3f53e5c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_342.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c3cdbf14f3c10ac6bd344f0cfbd73f91f19338abac94f3bb758c1e32cd4e656d -size 17244160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_343.const b/unet/.cache/NhwcConv_0-conv_inConv_343.const deleted file mode 100644 index 127d34d87f162324035839c86947ef666f48cc04..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_343.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_344.const b/unet/.cache/NhwcConv_0-conv_inConv_344.const deleted file mode 100644 index 4ccab2b6d5e263b903045c87acf1be8c2f1a2fe0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_344.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:40a2917fffb924f771c0eaa67eb9341aef2bb67068a1d8b4f0e17b3412064ec0 -size 12851200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_345.const b/unet/.cache/NhwcConv_0-conv_inConv_345.const deleted file mode 100644 index 2c136dbbafc0966f977e340ecd2626ec64868b16..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_345.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_346.const b/unet/.cache/NhwcConv_0-conv_inConv_346.const deleted file mode 100644 index 5485c60c52c04cf97adc66297ef54ac276edccda..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_346.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:49763bae56f010b35019d233a3323e6cd32c79ad9e8321354a1aa575d62728af -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_347.const b/unet/.cache/NhwcConv_0-conv_inConv_347.const deleted file mode 100644 index 4aa2870b129e62525b27fba7aa8e0ed4dcfe67d9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_347.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:570cd9fcc2d70f738d664b3c30ffe9bef0eaea25bbf74f971645790b81e7dd34 -size 1505280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_348.const b/unet/.cache/NhwcConv_0-conv_inConv_348.const deleted file mode 100644 index a378900f5a3546b38012ddbe266a223bd458d83c..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_348.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_349.const b/unet/.cache/NhwcConv_0-conv_inConv_349.const deleted file mode 100644 index 59f37548098db620ed6c0307d60168e7e1dc7b17..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_349.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5896acd5835f1dc1891e61f5a5c813f163e33b0697f61b534d7c6e6ab44fe65f -size 501760 diff 
--git a/unet/.cache/NhwcConv_0-conv_inConv_35.const b/unet/.cache/NhwcConv_0-conv_inConv_35.const deleted file mode 100644 index 5e574c12060904f40509b88fc1b30df684f722a3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_35.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:38784c86bcdc5dc06a03c8d92be32b440197ab1a11ce90859f689943a7f4445a -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_350.const b/unet/.cache/NhwcConv_0-conv_inConv_350.const deleted file mode 100644 index fd11ab27269f1a6f393e67a2bd8f01b468fe21b5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_350.const +++ /dev/null @@ -1,2 +0,0 @@ -4?H??;?L?C?B???0?)?G?=?@?7?Q??8?F?>?1?2?B?C?F?8?6?M?-?F?1?6???0?A?1?>??'?5?>?/?G?>>?*??2?D?U?>??2?C?O??F?0?0?/??C?1????3????K?9?6?6?5?>A?;?N?>?I?F?0????0?1?[?8?L???#?E?2?N?B??-? ?9?4?B?K?(?*?;?0?E?0?4?E?:?L?Q?Y?P??/?V?8?'?>=?!?@??7?2?/?%?D?>?/?B?@?>0?6?3?&?E?>E?>?6?)?4?@?1?2?F?>E?6?A?=?5?3?H?'? ?>$?0?F?:?7?C?@?2?>9?G?'?2??M?%????M?8?'?D?>>.?F??I?>?/?G?>>>?8?2?E?>?D???7?1?0?4?0?-?]??>&?7?1?)?.?2??>8?"?.?8?0?9?K?8?1?>?#? -?B?>?3?:?.?=?E?5?A? ?5?2?C?@?5?9?/?:?5?P?C?5?0?A?F?N?(?A?=?6?/?F?J?A?9??/?B?0??!??.?C?1?E?J??6??2?6??Q?9???O?M?>%?0??6?2?7?8?>?6?3? ?2?-?=??A?:?5?=?H?2?@?=?9?=??K??9?.?%?-?;?&?:?X?M?A???+?3?2?7?0?*?0?J?0?/?0?B?5?8?9???;?/?L?7?1?@??.?%?-?D>?=?1?D??F?(?7?4?????1?>P?H??7?R?-?> ?B?A?1?I?>5?D?N?1?!?K?0??9?0?@?'?4?A?$?2??/?D??2??7?1?/?9?L?F?0?(?1?4??#???=?0?'?E?9???@?L???/?)?(?>>)?0?;?'?J? 
??3??;?>>)?5?!?5?%?O?> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_351.const b/unet/.cache/NhwcConv_0-conv_inConv_351.const deleted file mode 100644 index 28ff3e1e31962472611e998b50bb0c87ae17af2e..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_351.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_352.const b/unet/.cache/NhwcConv_0-conv_inConv_352.const deleted file mode 100644 index d0590b7e3fb466309041ea6caf100d08d2e1f648..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_352.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:aae3782904dd80e3a4f02076d31c1f4766373dda4993b7edaef8803baaac6995 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_353.const b/unet/.cache/NhwcConv_0-conv_inConv_353.const deleted file mode 100644 index 71fcb486c52c6653c3ead276dce56b40baf1cfa8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_353.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c1284ecb6f6202efd16dc2f35c957e0af73575b248ba534b9546647b40ba8d5b -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_354.const b/unet/.cache/NhwcConv_0-conv_inConv_354.const deleted file mode 100644 index 7599c01c9602da887e932351caec601f384ea0e0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_354.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7c15902f702827883ff788405e0d54f0becaf9b24c96fc0c15e678bcbf8ea98e -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_355.const b/unet/.cache/NhwcConv_0-conv_inConv_355.const deleted file mode 100644 index a71a26508cce55f0176b4ba2b3d0d8938ed2ea91..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_355.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 
-oid sha256:09870dd6dea741895bc22db9f9a7cdb7be3e0968ee38772d4f1fbf03d79e0ded -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_356.const b/unet/.cache/NhwcConv_0-conv_inConv_356.const deleted file mode 100644 index 0557884ecb20383ff64cfb1ea5dd67f6bd322f46..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_356.const +++ /dev/null @@ -1,2 +0,0 @@ -%?4?(?0?3?(?%?G?!?1?'?0?!?A?*?.?)?2?9??&?,?,?4?#?4?$??0?,?@?W?>?%?.??-????1?8?2?0?%?"?#???7?3?:?S?3?3?B?-????=?&?'??7??3?>1?#?*????+?$?,?9?.?)??3?-?3???I?.? ?&?6?5?"?7??.?"?>'?%??9?4?7??6? ?/?4??2?2?0?2???#??9?H????1?)??=?3???1?&?3???8?0?5?4?*??!?2??;?*?"?2?>+??/?%?+?*?=?0?/???%?0?/?>??C??:? ?5?'??,??!?%?3?2?0?9??/??3?/?,??4?1???&?3??!?+?:?3??0?*?4??!?0????5?/? ??0??3?&?"???!?,?'?3?:?*?3??2?+?3??;?(?)?? -???'?B?>0??,?2???-??/?%?,?,?(??8?F? ?4??1?,?,??6?2?#?.?? ?$?0?'?(?#?B?(?"??/?>0?*?8?0? ???4??5?2??4?+? ?$?>??*?(????&??+????9?+?4??(??9?$???>E?-??"??>%????5?"?.?0?*?1?*?8?"?:?)?? ??$?3????>?0??5?"?,?3?4?$???D?>??&?*?1?0?9??@??$?0?,?;?(?A?3?:?4?+?9?)?(?2?#?!?#?8?1?-??9?4??(?&? ? ?? ?%?!?3?A??)?3?)?)?>?4?$?,?*?$?9?$? 
\ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_357.const b/unet/.cache/NhwcConv_0-conv_inConv_357.const deleted file mode 100644 index d03e95744e2c0763ad5dcd247a3d7b663bfb0d32..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_357.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_358.const b/unet/.cache/NhwcConv_0-conv_inConv_358.const deleted file mode 100644 index 79d4ad70b09c0075d288d4076166d68684f2695e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_358.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:89c2c25bedaf5d5feb82e3ae9936e502031920eae56c697bdd6cfcf7a44f3eff -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_359.const b/unet/.cache/NhwcConv_0-conv_inConv_359.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_359.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_36.const b/unet/.cache/NhwcConv_0-conv_inConv_36.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_36.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_360.const b/unet/.cache/NhwcConv_0-conv_inConv_360.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_360.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_361.const b/unet/.cache/NhwcConv_0-conv_inConv_361.const deleted file mode 100644 index 5d1c6209d31822cfdab470f01a324da2396b18b2..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_361.const +++ /dev/null @@ -1,3 +0,0 @@ -version 
https://git-lfs.github.com/spec/v1 -oid sha256:10381a01a7ec8a7915be515d9f3a00e7895136048b69948333b32bbfd793e844 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_362.const b/unet/.cache/NhwcConv_0-conv_inConv_362.const deleted file mode 100644 index 3a93ca1f8ee169deef9a3016d66a01172527035c..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_362.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_363.const b/unet/.cache/NhwcConv_0-conv_inConv_363.const deleted file mode 100644 index 0fa96d4b19c077aebaeabfb0c2997cf00f73c9e2..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_363.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_364.const b/unet/.cache/NhwcConv_0-conv_inConv_364.const deleted file mode 100644 index 393123abe44d3f157af68220a64933f7f96f6fed..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_364.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a755f1e75231c73c000b6cce44a1f72265bf451b5e44dc8d807b2e48bd6ca791 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_365.const b/unet/.cache/NhwcConv_0-conv_inConv_365.const deleted file mode 100644 index a4b4192d88ce44e8a27bfd06d5d3260480ec2888..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_365.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d5fd6c74fdfad3a74e7405d9596c46fadcd48c7638f51a2dd0aaa5be2a5fb6bd -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_366.const b/unet/.cache/NhwcConv_0-conv_inConv_366.const deleted file mode 100644 index 1748731e168758dddc7fca0a7453484421d3e097..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_366.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:fe16e116fee0002aa99d319b892c9e452cd0e3f2bdf122c5871ca20fff8d227b -size 1884160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_367.const b/unet/.cache/NhwcConv_0-conv_inConv_367.const deleted file mode 100644 index c29cdcbff57103ed6967160a35243d2cdb49d67f..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_367.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a99ab993dc4cf9f9224ce53b8c00ca290d9f8451fd4bb17d9a6c330523ece04e -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_368.const b/unet/.cache/NhwcConv_0-conv_inConv_368.const deleted file mode 100644 index d40b7f09092db33ef3d6d6fc9404541d6734ecbe..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_368.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_369.const b/unet/.cache/NhwcConv_0-conv_inConv_369.const deleted file mode 100644 index a7e00cc9b0df93f099733d997383d023816c0c0d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_369.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e68f74f77bac9b6489677b7792da922337d599a30ac31323ed77df2af2f3bdc3 -size 8622080 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_37.const b/unet/.cache/NhwcConv_0-conv_inConv_37.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_37.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_370.const b/unet/.cache/NhwcConv_0-conv_inConv_370.const deleted file mode 100644 index c7686bff3c4cb532748cabd5ba1faf74c6d82326..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_370.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_371.const b/unet/.cache/NhwcConv_0-conv_inConv_371.const deleted file mode 100644 index 
700dda77a0a323ff49f7fad687034e50635c7da9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_371.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:abf309a1154ff1bac71274c64f0b1275d40b8b050f08559498dd9b0f869561df -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_372.const b/unet/.cache/NhwcConv_0-conv_inConv_372.const deleted file mode 100644 index 568a819ee523cd94840020004b69fa58bd52ab8d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_372.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:08f730a910684153a19a5bc7cdee34a380de8ef9b2f4384f11832058476dd474 -size 1003520 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_373.const b/unet/.cache/NhwcConv_0-conv_inConv_373.const deleted file mode 100644 index 9d56490444e066ca4ec1ef729acaee1bd9e101ba..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_373.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_374.const b/unet/.cache/NhwcConv_0-conv_inConv_374.const deleted file mode 100644 index 7d32d490c7753a5359a7c776227628bd88ccb78c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_374.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:51bda076edc7400fd9cb5056bf54323d3f5df5d91a26ef7cf3ba7f7062fd2e4b -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_375.const b/unet/.cache/NhwcConv_0-conv_inConv_375.const deleted file mode 100644 index 7f5b05ced47d598282926313ee70beb72717cdba..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_375.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_376.const b/unet/.cache/NhwcConv_0-conv_inConv_376.const deleted file mode 100644 index b619d30fc87d59a77a1600c3555370f161d2ffc9..0000000000000000000000000000000000000000 Binary files 
a/unet/.cache/NhwcConv_0-conv_inConv_376.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_377.const b/unet/.cache/NhwcConv_0-conv_inConv_377.const deleted file mode 100644 index a345e1dcc2c237c48431e2b32a9923065b0f7075..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_377.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0a8791d7d9f6a92e20b4c5d6e820ddcd928f92e48ea0f9bb08e84e204315a41b -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_378.const b/unet/.cache/NhwcConv_0-conv_inConv_378.const deleted file mode 100644 index b53b9a59649795596f6256aa57e601272a1cc91c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_378.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:56b2e8ea76f48b6038bb131c3276fcf7735f2a34fb2107612f4f63eee54e7faf -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_379.const b/unet/.cache/NhwcConv_0-conv_inConv_379.const deleted file mode 100644 index 4dd4f18cc73a9088ccded984149975a3df3baa68..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_379.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b1e736fc0f748eff72f7a9ad7ddb97493748fd0be832dbddca5f04317cc8a6df -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_38.const b/unet/.cache/NhwcConv_0-conv_inConv_38.const deleted file mode 100644 index 96b17603c3ca9c865be616ab4253690a173c347a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_38.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e4c7f06093a7e43b5f7c1bc272355b333acea04b3c92e0a6645988f0ac2d02a8 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_380.const b/unet/.cache/NhwcConv_0-conv_inConv_380.const deleted file mode 100644 index 
e31431e911e1e44696458b96037f954e877d2247..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_380.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:31a207b2ced14b81bffa3fefbdd4ced6ed18a05982046c23fdd788c96f87d069 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_381.const b/unet/.cache/NhwcConv_0-conv_inConv_381.const deleted file mode 100644 index 8130f4266fe865e21e200c76d8392eb3a4c3f6d6..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_381.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_382.const b/unet/.cache/NhwcConv_0-conv_inConv_382.const deleted file mode 100644 index fa9336b26fcad741852824ca802ac501fd6e5698..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_382.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_383.const b/unet/.cache/NhwcConv_0-conv_inConv_383.const deleted file mode 100644 index e870450ed2a4e1c4c2cb7d1be4049e4e7e0376bf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_383.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3f27e3ad7a577ef9f71352df173a42b3e69f06188c3d3dc4ca3e2ecce0fcc560 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_384.const b/unet/.cache/NhwcConv_0-conv_inConv_384.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_384.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_385.const b/unet/.cache/NhwcConv_0-conv_inConv_385.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_385.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_386.const 
b/unet/.cache/NhwcConv_0-conv_inConv_386.const deleted file mode 100644 index 38cefa2ddd6def562ea25847c1de58bf37a13d75..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_386.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e9f6b17b8eec0d52aac645134e3e7f0c10b061193d2935f16ee6c5f9bf0c0093 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_387.const b/unet/.cache/NhwcConv_0-conv_inConv_387.const deleted file mode 100644 index 8c71064ac6a1cd30c5031e443143bc1a1564a558..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_387.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_388.const b/unet/.cache/NhwcConv_0-conv_inConv_388.const deleted file mode 100644 index 74ac8f0f53fd520e731b9405142bdeb5a75b4550..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_388.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_389.const b/unet/.cache/NhwcConv_0-conv_inConv_389.const deleted file mode 100644 index 328ca92304d450bbc44133465021b6bc1bb4ae8c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_389.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9dd16fbf9ec1482329007693a877b9e1a16a71e79e2bd84d063b31beb4a3a9c0 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_39.const b/unet/.cache/NhwcConv_0-conv_inConv_39.const deleted file mode 100644 index 3dba8ff93afe73e24ddf494d1f2b518cc701d2f4..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_39.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_390.const b/unet/.cache/NhwcConv_0-conv_inConv_390.const deleted file mode 100644 index 51f04f3bb1258b9345b933bdf1089edeab0d6eb5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_390.const +++ /dev/null @@ -1,3 
+0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:38e31a25a0d96870397ee43b5cddbdfff3550a016e3cf98096f1a4448aced09d -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_391.const b/unet/.cache/NhwcConv_0-conv_inConv_391.const deleted file mode 100644 index 6280b727d7d152b25c557584c23bde11c0dd17ed..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_391.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:57e8ccf37cae739ebeddfb7adb29e70319d197f4a5840e4df0b05c0ba55f8633 -size 1884160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_392.const b/unet/.cache/NhwcConv_0-conv_inConv_392.const deleted file mode 100644 index ea884a49dc27386f0d00c10b0bf0d57929d9f990..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_392.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e20ae01e96219c275b58a6c6bd4622ad8d72ec64a2cb3d3581aaa7bb5e19bd5b -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_393.const b/unet/.cache/NhwcConv_0-conv_inConv_393.const deleted file mode 100644 index 9f1102a6b3f03e2417440d75cae0506d6fc3fe28..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_393.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_394.const b/unet/.cache/NhwcConv_0-conv_inConv_394.const deleted file mode 100644 index 0447abe14bfac605f07b3fd9756d966b07d43a33..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_394.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d266ee3f90ce143f41268c1372b4ef6116b9ef12892679da804871983e8fd7fb -size 6425600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_395.const b/unet/.cache/NhwcConv_0-conv_inConv_395.const deleted file mode 100644 index 5623b1bbb3839504bf2430dcd497a38b148edab6..0000000000000000000000000000000000000000 Binary files 
a/unet/.cache/NhwcConv_0-conv_inConv_395.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_396.const b/unet/.cache/NhwcConv_0-conv_inConv_396.const deleted file mode 100644 index 926eed40509b48f47e08b3ec58f3112b4f85414a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_396.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f2da3f822375c66167819bb951f39624ee2ac4deb3f887992551128a4413cc8f -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_397.const b/unet/.cache/NhwcConv_0-conv_inConv_397.const deleted file mode 100644 index 163ef9fdac4438adbb29511f7577865b8f1e91fa..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_397.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:429ad5cdf463a051c3843f4da4203267b132328a7c867474ed0cbfb2e156032d -size 752640 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_398.const b/unet/.cache/NhwcConv_0-conv_inConv_398.const deleted file mode 100644 index 5b18862c370fb89b7d4622bd645f89442f44cb46..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_398.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_399.const b/unet/.cache/NhwcConv_0-conv_inConv_399.const deleted file mode 100644 index bb086ad56980fd8675e65dac1ef22f2cbd46cd23..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_399.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c885daa26d808802620b991898a1b1f17a3476de4f0276705b5f69e70ffda3e0 -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_4.const b/unet/.cache/NhwcConv_0-conv_inConv_4.const deleted file mode 100644 index 90a65d210caa1825bfc3c6cb14e93ad8d7348bda..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_4.const +++ /dev/null @@ -1,3 +0,0 @@ -version 
https://git-lfs.github.com/spec/v1 -oid sha256:3b909bdf14b70ea0e1fc998922f5691223471f14fac3ffb33dec856687ee8a16 -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_40.const b/unet/.cache/NhwcConv_0-conv_inConv_40.const deleted file mode 100644 index cb80ee1b6ca84d86212c2a0a6c388f6ac50a7f77..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_40.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_400.const b/unet/.cache/NhwcConv_0-conv_inConv_400.const deleted file mode 100644 index caf1c8bcdd0c3c9fa73fbcc1e26ad02eb82dc355..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_400.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_401.const b/unet/.cache/NhwcConv_0-conv_inConv_401.const deleted file mode 100644 index d58dcddf14f1d96a0e14f9409c346876a4f49f5a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_401.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_402.const b/unet/.cache/NhwcConv_0-conv_inConv_402.const deleted file mode 100644 index 2f8a9d85e0f7e20de071ae7eed1bc4f9d4867c37..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_402.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:742ead6f3702ed562290aa359115770263f3a48122d1c89c5eb02d01581cfa3d -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_403.const b/unet/.cache/NhwcConv_0-conv_inConv_403.const deleted file mode 100644 index 5d4c7507bb405e220af0eb634ae23f5d0b840ee0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_403.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d44766cdd8cbab03955256fd5290c47424c65e508aac4906a671e2a73f0e4bc7 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_404.const b/unet/.cache/NhwcConv_0-conv_inConv_404.const 
deleted file mode 100644 index 7f1dbfd257692aee054b6cdb84df29c9aacf2dbf..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_404.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:797648fbb30b303d155db28e22d75cd505244f0122018f45958aefc114c8d46b -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_405.const b/unet/.cache/NhwcConv_0-conv_inConv_405.const deleted file mode 100644 index bf0935c05d520f6c500ffa246aecfc81643e27bd..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_405.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2f49f0497c8825f282d22888bbe22b9b0564173c654b1600b6f8d3036d612bae -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_406.const b/unet/.cache/NhwcConv_0-conv_inConv_406.const deleted file mode 100644 index c3eebdb12d2af749b0b0d870b36234d08856d1a0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_406.const +++ /dev/null @@ -1,15 +0,0 @@ -?????#??(??????? -???????????????????"?? ?????? ??$??????????>??????? ?#?? ??????>?????? ???? ????? ?"???????????>??????? ?????????????>??????$?????> ? ?? ? ?????? ???????>?????? ???????#? ? ?????????????? -????????? ???? ?????????"????? ?????????????????>????? -?????????? ?????????????? ??????'?>>????????#?????????!?!??????%????#?????????>??????????>? ??????????!????????!???????? -???? ?? -??????>%?? ?*???? ??>??!?!?!??>!???? -???? ??>????? -????????? ?????????????>??????????????? ???>?"??? ? ???>??????????? -???????>????????> ??????????? ?? ?? -?? -?$??????!??? ???? -??????? ?%???????"??!???????????#????????>????$??? ? ??????????? -??????!??????????(????? ?????? -?? ??"??>)????? -?>%????? ?? ???? ??????????????????????????? ???? ??????? 
\ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_407.const b/unet/.cache/NhwcConv_0-conv_inConv_407.const deleted file mode 100644 index 5e221fdf47a3fbd177abb6b35d29933e20908ecd..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_407.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_408.const b/unet/.cache/NhwcConv_0-conv_inConv_408.const deleted file mode 100644 index bab76577d3d6c77c6a9b62e98fcb0db82ed6e438..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_408.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ee22ea7111fee9421123ed87a78fd3b6b35d95803ae99ace0bbe599696636cb6 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_409.const b/unet/.cache/NhwcConv_0-conv_inConv_409.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_409.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_41.const b/unet/.cache/NhwcConv_0-conv_inConv_41.const deleted file mode 100644 index eea5ef854a1902f4cb7272b75a78f77f2b10f7e2..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_41.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:60bb29afd5b80e6e7f238471340513ae44bf0ab76f8de52b8f6c003bdf93b26a -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_410.const b/unet/.cache/NhwcConv_0-conv_inConv_410.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_410.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_411.const b/unet/.cache/NhwcConv_0-conv_inConv_411.const deleted file mode 100644 index 
6c7f8c3d72d3f5bc45678eb04517fa3065980967..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_411.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7dec255f035bdf0f18f94cedc7b7daa69e7b508845085101a0e1fb8a7177d314 -size 473600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_412.const b/unet/.cache/NhwcConv_0-conv_inConv_412.const deleted file mode 100644 index aaa0aa09df3f7337fe81fb00f45fb31ad65615dc..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_412.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>o>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>z>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_413.const b/unet/.cache/NhwcConv_0-conv_inConv_413.const deleted file mode 100644 index 2c428c619f864fc022541db5f385153b28aa9f2a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_413.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_414.const b/unet/.cache/NhwcConv_0-conv_inConv_414.const deleted file mode 100644 index 514eb5560ab7603dde82725f8c311eb226b6f132..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_414.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a0bd5d13ec2532bcfa4726ff8a186e00d4a787f0114babcae52a9f6f626f6b81 -size 
1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_415.const b/unet/.cache/NhwcConv_0-conv_inConv_415.const deleted file mode 100644 index dd1a5cc4512ae490ccc7210d718168451d327318..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_415.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ba6c5211283bc0179a24240a78ce088640c79f6df2ecde470e4b0e4cb33c159a -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_416.const b/unet/.cache/NhwcConv_0-conv_inConv_416.const deleted file mode 100644 index f3077cfa6bea770dfe377fee56b181a3c7fc024b..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_416.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4c05ff49ab128d82f57691d01a844f3e254da05f7b92d14f02fddf79bdf2a391 -size 1884160 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_417.const b/unet/.cache/NhwcConv_0-conv_inConv_417.const deleted file mode 100644 index e015818567bc310764984d7a3a35804a812e45b1..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_417.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3daf53fbcb991a52743d3349ef4d961e6aca6e5e70c9becdb046a97d92a8ab03 -size 501760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_418.const b/unet/.cache/NhwcConv_0-conv_inConv_418.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_418.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_419.const b/unet/.cache/NhwcConv_0-conv_inConv_419.const deleted file mode 100644 index f284b81b0bab2945215ced91375c2a3c8fbf03fb..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_419.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:edd02b258ec6ac2a7b98819ed95b5ea930b5e57be8c866d6d23baf43e98e4c93 -size 4311040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_42.const b/unet/.cache/NhwcConv_0-conv_inConv_42.const deleted file mode 100644 index 1956693232e60975a73b632062efa5dff09cd6c3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_42.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fbe0b48aa568257546a957a87d3083a1b9b6283bdc82eddcfb920b3b8b0ac140 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_420.const b/unet/.cache/NhwcConv_0-conv_inConv_420.const deleted file mode 100644 index af1e99cbbca86c224486b0965b9b52a715cbc643..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_420.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_421.const b/unet/.cache/NhwcConv_0-conv_inConv_421.const deleted file mode 100644 index a556e9fae7e8e94e39c19398dd256eb31e11a20c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_421.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2907ec80d9d60ae121d65126cd0b0dbfd25e81aa950e5a5d296846e16dbf64e8 -size 3212800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_422.const b/unet/.cache/NhwcConv_0-conv_inConv_422.const deleted file mode 100644 index 75ad57ebe97f07f772c7d3d1da45cbc40434272a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_422.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_423.const b/unet/.cache/NhwcConv_0-conv_inConv_423.const deleted file mode 100644 index 3558679a174f9f52064cb3ee4fe1841fe3903317..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_423.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:60379c4cab27038f521a563ddb1e51a7b894ab340fc8ce9528c7b8b23bacd321 -size 1077760 diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_424.const b/unet/.cache/NhwcConv_0-conv_inConv_424.const deleted file mode 100644 index 5afc9c117aaf0257b52532d3576852f8a2d73ce8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_424.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d68861ac904d248d6a202b5b6a7b34b0b377d3cc97ba4573f0e0c61a06dc01ad -size 376320 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_425.const b/unet/.cache/NhwcConv_0-conv_inConv_425.const deleted file mode 100644 index 08e540bb79b9403786382aebba5ca1f5cc1aad9c..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_425.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_426.const b/unet/.cache/NhwcConv_0-conv_inConv_426.const deleted file mode 100644 index 56d03734e552d8674681d48a37faa0a58d9e5a3a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_426.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:977ba4d98d779cd28ab33f05cb79f2f732b64c21a11665ab6c90b635492d990f -size 125440 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_427.const b/unet/.cache/NhwcConv_0-conv_inConv_427.const deleted file mode 100644 index 1fdeb35b7451a9e3fc57293a463baf58e814745d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_427.const +++ /dev/null @@ -1 +0,0 @@ -?T?p?z?0?O??l?4??????o?V??k??p?q?Y?m?r?p??:??:??l?O?a?P??e?K?Z?k?M?`?V???\?;?p??p?p?X?c?Y?"?d?N??0??H?f?4?D?>o??_???`??b???w?v?s?0?q?{?_??M??/?h?q??3?R?/????p?{?|??? ??M?D?`?X?z?J??*??E?>|?:?b??R?f??]?q?^??H??A?-?X?z?1?O?L??^?N? ??{?V?p???o?o?n??n?p?9?f?P?P??t?}?o??$?5??P?`?_?>?T?t?c??b?v??{?>>8??s?>?>?M?l?y?M?]??X?c???-?O??f?J??A?1?k?_?|?>?p?w?v?g?P??c?>~?r???L???g?Q?L?|???y?j???X?V?x?|?>X??>?=?'???R?Q?N???s?]?}?*?j?"???V???&?k?G??}??s?5?O?y??M?l???H?2?U??O?Z?;?:?P??.? 
\ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_428.const b/unet/.cache/NhwcConv_0-conv_inConv_428.const deleted file mode 100644 index 563a1ca34b12911050a811dbf9aab03493eaa593..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_428.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_429.const b/unet/.cache/NhwcConv_0-conv_inConv_429.const deleted file mode 100644 index 5d1bf4c1e7d67060393c724515705cd7290e4682..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_429.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9fb71f06a03724310d23a10527d535b17d6cacbfd52426e4b8077f54769b94dc -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_43.const b/unet/.cache/NhwcConv_0-conv_inConv_43.const deleted file mode 100644 index 94a5e3bbfd84cf1861a97206f8316735ca06dd74..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_43.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:686d4a591d05d1eeb7edfdf46fe3cf39f694060f7768e4f30e2b7bcbbcdd3af0 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_430.const b/unet/.cache/NhwcConv_0-conv_inConv_430.const deleted file mode 100644 index 66ff5d319b3db97bff568cfe68a32b72d6cc7369..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_430.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:427ae84663d12201b200aa1dc8ec218af5aaf5af389829aa1d34b1fe31bbde3c -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_431.const b/unet/.cache/NhwcConv_0-conv_inConv_431.const deleted file mode 100644 index 660679e56662c7f6091c0dc4ec0448356e153987..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_431.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:b1541e657c08d1cdab2bca0f4705916fe117b6ba208ce1ebfe3d0e2d516da27a -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_432.const b/unet/.cache/NhwcConv_0-conv_inConv_432.const deleted file mode 100644 index f42bfd7143d46b498576a99b6c41097f15a84678..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_432.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4fecb9c6804e62ba748a7f1b7556599e7831a2769190b3ba94ce905b36ee2b86 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_433.const b/unet/.cache/NhwcConv_0-conv_inConv_433.const deleted file mode 100644 index 41590294b663235991fd9658dcd714d2fc3b2dc8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_433.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>D>>>>>>>>>>>>>>>>>>>>>>>8>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>V>>>>>>>>l>>>>>>>>>>>>>>>>>>>>>>>>>{>B>>x>>>>>>>>>>>>>>>>>>>>>>>>>>>V>>>>>W>>>>>>>>>z>>e>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>l>>>>>>>>>>>>>>>>>>>>>>>>M>>>>>>>>>>>>>>b>>=>>>>>>>>>>>>h>>>W>>>s>>>>>>e>>>>>>>>x>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_434.const b/unet/.cache/NhwcConv_0-conv_inConv_434.const deleted file mode 100644 index 6d166e345f6a00eab6e0f61296a5b3fb0af13852..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_434.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_435.const b/unet/.cache/NhwcConv_0-conv_inConv_435.const deleted file mode 100644 index e07e3c837dd856e1e69d36c8c8116c77cd80cd90..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_435.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:3ede1bf33751490f0e1989ac17be4d8f07d34c75a036b86bccdc39247184f782 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_436.const 
b/unet/.cache/NhwcConv_0-conv_inConv_436.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_436.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_437.const b/unet/.cache/NhwcConv_0-conv_inConv_437.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_437.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_438.const b/unet/.cache/NhwcConv_0-conv_inConv_438.const deleted file mode 100644 index fed0634b48fbc438a9efb29ad1f5a4e88380fbf7..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_438.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9fd154fe3d16d572bdd47ee68612582befd7c7dd5195c407f3f1aa8d60b7ec5e -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_439.const b/unet/.cache/NhwcConv_0-conv_inConv_439.const deleted file mode 100644 index 936c0a6c48a8363bbe1f1e35c0807da7ebe98634..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_439.const +++ /dev/null @@ -1 +0,0 @@ -[?j?K?^?R?^?M???E?,?P?X?F?L?R?W?C?=?O?9?;?G?3?`?P?`?R?=?;?!?C?N?&?M?K?^?X??Q?6?N?R?d?j?5?+?G?G?7?.?@?>W?>?.?*?X?F?R?R?J?=? ?A?1?P?T?X?P?-??H?S?B?Y?J?d?\?F?=?P?M?D?A??,?\?>?.?S?#?.?_?Q? 
\ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_44.const b/unet/.cache/NhwcConv_0-conv_inConv_44.const deleted file mode 100644 index aba20c4c1eb06b30885b644f1983ce5f97e2f4e9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_44.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:39d5fd935c0ecf1c05e21839d79379bfc425da924a44ba401f84295cfcddc8ca -size 125440 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_440.const b/unet/.cache/NhwcConv_0-conv_inConv_440.const deleted file mode 100644 index f81e984ad31ecddb705a0b1a56107434d983fb6a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_440.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_441.const b/unet/.cache/NhwcConv_0-conv_inConv_441.const deleted file mode 100644 index e6ac994ecd59e0d5f6e9a4c831b5cea6e6a9bc20..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_441.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:718cefbf20c21a856a97e79e0ce8e1afa78d5ce21ce3ef335ecf677b00112dfd -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_442.const b/unet/.cache/NhwcConv_0-conv_inConv_442.const deleted file mode 100644 index babb97ac664f32d554da19b227b9a3390db24841..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_442.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4050bf203f6a4603377f6f3f26c729f13e36ff624d76e0a7d253c8530a008f1a -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_443.const b/unet/.cache/NhwcConv_0-conv_inConv_443.const deleted file mode 100644 index a1da921eee443b1ef6950252d6cfd206e670a05f..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_443.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:61ff6d2d806d1f92a6221d8fa1a4da66f182e96a7e73e28c992700b3891f0f6d -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_444.const b/unet/.cache/NhwcConv_0-conv_inConv_444.const deleted file mode 100644 index 2e93e9e14edd1d769a0b1a018402326ad13521d3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_444.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:adc17b451e905af6e9d4aea262e109f7315d88280386e678636f4688767fead2 -size 125440 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_445.const b/unet/.cache/NhwcConv_0-conv_inConv_445.const deleted file mode 100644 index 6be095f31ce33a61fbb95f377afdca1fb26a2a98..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_445.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_446.const b/unet/.cache/NhwcConv_0-conv_inConv_446.const deleted file mode 100644 index 3e5fa430273837ed5dbd9a9c09b0e0cd7bc44d0c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_446.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c7c9deb366a9f3d38e99e242f25b6d9be9000c0fc76a0395131df5a09f951759 -size 2155520 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_447.const b/unet/.cache/NhwcConv_0-conv_inConv_447.const deleted file mode 100644 index 4809fa6f1d9485b13ef51b2787b439370bae60e9..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_447.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_448.const b/unet/.cache/NhwcConv_0-conv_inConv_448.const deleted file mode 100644 index 4728203fc8dc49de663bbb96c9530db6336011e6..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_448.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f9deb8517ac75cd389942b6b97c2c9cfa9edb976cde6db13f82e55d1c9fc4830 -size 1077760 diff --git 
a/unet/.cache/NhwcConv_0-conv_inConv_449.const b/unet/.cache/NhwcConv_0-conv_inConv_449.const deleted file mode 100644 index ec628d5910746caa4244fe8f198a538dabdf570c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_449.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:1e76d842eb6649e51d1c55e021941e2adb31aa1ebcbff0e49a53d892e50eda53 -size 250880 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_45.const b/unet/.cache/NhwcConv_0-conv_inConv_45.const deleted file mode 100644 index 191c89b4852ce7da318e9a8d69a7cb74e175f652..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_45.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_450.const b/unet/.cache/NhwcConv_0-conv_inConv_450.const deleted file mode 100644 index f7d0b9b310a0b03d6aa7012d59a85b96a463c94e..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_450.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_451.const b/unet/.cache/NhwcConv_0-conv_inConv_451.const deleted file mode 100644 index 2d25e7185a16729c5637f7a81d81469e040548a8..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_451.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c66707e5d4a33dd45af789f4925e932f078e6e7a9da6088f956830083e2a2442 -size 125440 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_452.const b/unet/.cache/NhwcConv_0-conv_inConv_452.const deleted file mode 100644 index 0bae715181f7108520c57ee0d28ff151f63adfe3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_452.const +++ /dev/null @@ -1,2 +0,0 @@ -[?R?o?N?/??4?X??;?M?t?Y?Y???!?????R??G?N?d?1?B?n?`?j?O??>?t?Y?u??H??p?r?`?2?`??c?.?0?c?8?a?s?_??]?i? ?(?H???p?p??|?k?N?;??p?L??t?b??Z??o??p?"?T??p?p?j??,?2?p?&?k?m?o???}?+?J?(?]??-?H?S?D?J?\?z?p?-?~? ?]?b???Y??z?p?b?3?H?P? 
?X?|?9???R??P?m?U?U?)?^??R?>?l?*?K??O?>T?J?k?b?>]?2?B?>j?a?/?V?P?p?M?Q?0??>|?8?;?>>>??b?>!?O?H??B?K?x??*?]?`?n?P?"?0?G??%?A? ?M?t??m?;?2?o?f?c??a?b?n???0?,?X?f?@?%?>u?N?o??o?G?p?`?P?6?P??D?0?J?M?_???O?f?4??3? ?>W?`??Y?C?f??P?m?O?P?6?A?M?0?k???z?&?I?N?S?u?w?)?}?f?H?V?I?_?>g?? \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_453.const b/unet/.cache/NhwcConv_0-conv_inConv_453.const deleted file mode 100644 index e2108afa7a5eeeeabf019e2f5becbb64f388da3d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_453.const +++ /dev/null @@ -1 +0,0 @@ - ޻P>;.@<,<;I=>;B{}}===>==%>Q,==L=Rz_7=ɻ==<Ȼ=;=<=<<=ȼi:h>н=%>>>;9=μ=@(==='A==*J>==>cd>_==i<<=<=SE=E(Ͻ`B>0<<^:$ >>=ǼQ<<|;=<1;=0==$=Vsdn=޽pν9<7=.6>Q>>0)"=s=潳=Cݼ==(<#>m<(><^=2;C<<p>:=4=::R=ke>= 9==e=0=>>==>l<=м><.[=<6O=Xӽ=t{<3>,>꼋g=:<\=Vg<===.ͼ=!=:n<<K=L;[<==&7_=i=v=1;==:N<\=>=;ZX>={<]<>P==s%>: \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_454.const b/unet/.cache/NhwcConv_0-conv_inConv_454.const deleted file mode 100644 index fb3290b7f2203b217b9bcf6ef7a6bb25b0ad290b..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_454.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f979af0fa880bd7c8b6c2a0d01db11f869cb227768b7cf93a74691811f167f67 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_455.const b/unet/.cache/NhwcConv_0-conv_inConv_455.const deleted file mode 100644 index e049a5ed11509070d346a955b9bbd41eb20a1939..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_455.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:528a4912ef85a2c76e735defae3543e3dfe78afd88373a1b8da2287a65fd1603 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_456.const b/unet/.cache/NhwcConv_0-conv_inConv_456.const deleted file mode 100644 index 
0af9c5056d169caefb1b77bed15fc4dc08580274..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_456.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d3428ae71198efa3a18e8dce2bebcd6f848884adefc264c7c47bb90b5aec1838 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_457.const b/unet/.cache/NhwcConv_0-conv_inConv_457.const deleted file mode 100644 index 45aee9e3c4983d38d29f0dd1b45475e06cc69b96..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_457.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:acffaafcdc5193071e4eb76289e6405388869772d5d2a79546d371a428b2d06d -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_458.const b/unet/.cache/NhwcConv_0-conv_inConv_458.const deleted file mode 100644 index 5095a1e3b90df04eaf67e94758f86f6602de73c6..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_458.const +++ /dev/null @@ -1 +0,0 @@ -> >>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>s>>>>>>>>>>>>>>>>>>>>>>>>>>=>>>>>o>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>y>>>>>>>>>>>>>>>>d>>>>>>>>>>>>>>>Y>>>>>>>>>>>|>z>>>>>>>w>>>>>>>>>>>>>>>g>>>>>>>>>>>C>>>>>>>>>o>>>>>g>>>>>>>>>>>>>>>>>>>>>>>>>>>>N>>>>>>>>>>>>d>>>>>>>>>>>>b>>>A>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_459.const b/unet/.cache/NhwcConv_0-conv_inConv_459.const deleted file mode 100644 index b65d6845d41e31cf225da71b728ad48e7e6a0410..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_459.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_46.const b/unet/.cache/NhwcConv_0-conv_inConv_46.const deleted file mode 100644 index 16a8f22033eab848957ea487b0cfa089031da11a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_46.const +++ /dev/null @@ -1,3 +0,0 @@ 
-version https://git-lfs.github.com/spec/v1 -oid sha256:0de364da701591e50f90c837aa03b420525b6db5a584ed78b5cc70b471dc21d0 -size 467200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_460.const b/unet/.cache/NhwcConv_0-conv_inConv_460.const deleted file mode 100644 index 94b40f5a8b8964c5f9fd41a07a22e43391095a87..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_460.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:12caf26fffcd872dc8037c200bcf21c60fe761da7b110afdbf64dc0ba6a59f56 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_461.const b/unet/.cache/NhwcConv_0-conv_inConv_461.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_461.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_462.const b/unet/.cache/NhwcConv_0-conv_inConv_462.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_462.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_463.const b/unet/.cache/NhwcConv_0-conv_inConv_463.const deleted file mode 100644 index e53ca130c91e0ddd28f0708bda1ff11edb3e22da..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_463.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b8a01aabda2e5d0ce7d4968f7d62cc09631d6eef7f1e2cef17e6390c57017257 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_464.const b/unet/.cache/NhwcConv_0-conv_inConv_464.const deleted file mode 100644 index 2e506e3e40769bbc586758588b09ee9ea98ba53c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_464.const +++ /dev/null @@ -1 +0,0 @@ - ?-?*??7?0? ?5?6?4?B?7?*?8?6?,? ?:?/?(?2?(?1?4?2?E?G? ?(?-??:?C?0?-?3??0?.? ?=?8?)?>??3? 
?+?8?,?2?H?!?K?=?,?3?-?5?9?%?1?0??0??/?"?4?.?)?9?-?I?U?"?F?P??.?A?5?$?+?=?@?H?(?=?$???A?D??)??-?&?6?4?'?5?'?0??9?8??6???0?:?*?!?,??#???>?7? ?/?;???>/?:?/?4??0?1?9?5?>?$?(??3?*?4?2?>5?0?H??>>D?-?"????*?'?9??>0?)?.?'?)?/?4?>C?9?-?8??6?8?(??0?5?@?2?(?+??4??7?,?,?2?0?!?+?0?5??7?X?;?'?>G?(?1?:??9?3?,??????3?,??0?!?B?>4?)?>:???>#?5?&?1?B?"?;?B??/?5? ?&?4?(??7??#?3?'?.???,?&?D?-?(??5?,??;?(?>?>>9?>>>?>7?????$?>8?R?>>>>???z?>>??8?>?>>??P?(?>?!??>*??>?!?S?> ?>>j?>> ?>?(?&?.?>1?$?> ?? ?G?>>?>>? -??o??>5?>>,??>?>?>??>>?>? ?1?>?(?!?>>> ??I?B?>>?>>P??? ?*?$?> ?>+?>R? ?>?> -??>>t??>?(???>>?8? -?+?>>?> ?6?>>?e?>!??&???>>? ?\?P??>>7??>>9?>(?.??>u?0?,??>?>1? ?>>/?3? ?>0?3?>?.?? ??l?>(??? ?{>>>)? ?>?>0??>>=?>/?>1?>>?>)?>3??>?[?.?]?/??>B????=?>>Y?>??>>1?l?>>0?>P?>>>???>??^?>? ?>>7?????>[?>>l?L?>>?? ?_?>>?>>?8?&??>>"?7??>?]"M`ƽE!phi(սM/>boNF`(H} zN1\iy!0j񽼽^aCB+ZN2 ĽcL;¾񽤾QFCnxa0@c3h$iuCOktJ2j6#8Er.ggz[40ҽGIJ㽬V+ֽtfn|꾡;ҽK^ #=LOM@d-NpHk W4Hsn, d ٽ0P.޽- /p6̾jP1ֽ: Q -J -Ľ;m[Y󽒾-p?j&w%!ʾU3~/t3#@v].ebe \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_480.const b/unet/.cache/NhwcConv_0-conv_inConv_480.const deleted file mode 100644 index f491e4bb79c9d9d5f228d35a23a8143fc7181741..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_480.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:fc75b9ab43c9ee5b7ca5edbae72463d099197d66826786d5c4fceda7e5453d0c -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_481.const b/unet/.cache/NhwcConv_0-conv_inConv_481.const deleted file mode 100644 index 0fb3bd4ea0122607b6fa6ece826c0122c806df51..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_481.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a0bd244ae1278e405112862b2d1a1ce40f66f9438d19e52794e21a6f0664e818 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_482.const b/unet/.cache/NhwcConv_0-conv_inConv_482.const deleted 
file mode 100644 index 23cb2da0c2ef24d701970aae4c20e2f57bba2a04..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_482.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:238b277a6bc15270c2f2fcf2a0f4fe4d172029ed22b7e4f15fa93bfc61abefa4 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_483.const b/unet/.cache/NhwcConv_0-conv_inConv_483.const deleted file mode 100644 index b91579337abe682e2d772fc288d9eaf11c52754d..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_483.const +++ /dev/null @@ -1 +0,0 @@ ->>>>>>>>>>>>>>>>>>>>>>>>>>>>>k>>>g>>>>x>>>>>>>>h>>>>w>v>>>|>>>>>>>{>>>>t>>>n>>>>>>>>>>>>>>>>>>s>>>>>>>>>>>>>>>>>>{>>>>>>>>>>>>>>>>>>>>>>>>>>>>`>>q>>>>Z>>>n>>>>a>>>>>>>>>>>>>>>>>>>>o>n>Q>>>>>>>>>>]>>>>>>>>>>>>>>>>d>>>>>>>>>>>~>>>>>>>>>>{>>>>>>>>>>k>>>>>>>>>>>>>>>>l>>>>>>>y>>>g>>>>>>>>>>>>>>>>\>>>>>>>g>>>>>>>>s>>>>y>>>>>>>>|>>>>>>>>>>>>>>>>>l>p>>>>y>>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_484.const b/unet/.cache/NhwcConv_0-conv_inConv_484.const deleted file mode 100644 index 96d5250c1ac795a686669819e11b23a8d0447fb3..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_484.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_485.const b/unet/.cache/NhwcConv_0-conv_inConv_485.const deleted file mode 100644 index c56a2cf8c56df783afc1fc7884d571086528a2bb..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_485.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2e2953060fcd4ed80f2c7b7389fa1d051ad1f23bdc511e6037728e7a6fc351c9 -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_486.const b/unet/.cache/NhwcConv_0-conv_inConv_486.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files 
a/unet/.cache/NhwcConv_0-conv_inConv_486.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_487.const b/unet/.cache/NhwcConv_0-conv_inConv_487.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_487.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_488.const b/unet/.cache/NhwcConv_0-conv_inConv_488.const deleted file mode 100644 index 0e34ad04d39499e5e1f2f00ecb6cf1ca8172cf94..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_488.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5d4e13b55cc1668b50c09b7c1661bd8abdd128e5c60af7147a5fd876098216e5 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_489.const b/unet/.cache/NhwcConv_0-conv_inConv_489.const deleted file mode 100644 index 7f7872b4126351b9b20b6e7b21d3f55f408b2f79..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_489.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_49.const b/unet/.cache/NhwcConv_0-conv_inConv_49.const deleted file mode 100644 index 5a419173f9ce99c6b08b577dbd43f94dc9c01308..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_49.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:938a42340d9f12adbdef239f4202e047efea1f363b161326ef3c44538f06f2b0 -size 1077760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_490.const b/unet/.cache/NhwcConv_0-conv_inConv_490.const deleted file mode 100644 index 2ea056c1861dce2c5ba5a0f43032287d0e9b2019..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_490.const +++ /dev/null @@ -1,4 +0,0 @@ -=<====!=lk==#9=;==:Rq:h>=Q#< 
Ǽ=<<;lf\<;=>>F>>1>l>>U>>>l>>>>|>>>>>>>>>z>>>>>>>F>>>>>>>>>m>>>>>>>>>>>>>>>>>>>>>>{>g>>>>>>>>>>>>>>>>x>>>>>>>>>>>>>>>>>O>>>>>>>>>>>>}>>>>>o>>>>>>>Z>x>r>>>>>>>>>>>>>>>>k>>>>>>>>>>>>>>>>>>>>>>>>>>>>>y>y>>>>~>>>>>>>>~>>>>>\>>>>>>e>>>>>v>>s>>>>>U>i>>>>~>>>z>>t>>>>>>>~>I>>>>>>>>>>>>>>>>>>>k>>>>>>2>>>>>>>>>>>>>}>g>>w>>>>>>>>>O>>>>y>>>P>>m>>>>>>>>m>>>>>>c>]>>>t>p>>>>>>>>>x>p>>>>>n>>>>>> \ No newline at end of file diff --git a/unet/.cache/NhwcConv_0-conv_inConv_59.const b/unet/.cache/NhwcConv_0-conv_inConv_59.const deleted file mode 100644 index fb3ac4d6a70cdbafb20ba5fe62959a787b749225..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_59.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_6.const b/unet/.cache/NhwcConv_0-conv_inConv_6.const deleted file mode 100644 index 0873591a6c2afa00bd34faf28a3cf2d64034f37e..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_6.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c06b2aa8d3ec87e9cc323c1f3619c0cde384e91d8c3f0ac07053096d77c6eb13 -size 281600 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_60.const b/unet/.cache/NhwcConv_0-conv_inConv_60.const deleted file mode 100644 index c3b08cfc2e5b9ba2ec5263b7cae9256563c55a0b..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_60.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:01e16c94f58d169fd2df434e2f118dbb979c3a0763bd3815ae2cd72e718f89cd -size 118400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_61.const b/unet/.cache/NhwcConv_0-conv_inConv_61.const deleted file mode 100644 index 00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_61.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_62.const b/unet/.cache/NhwcConv_0-conv_inConv_62.const deleted file mode 100644 index 
00bc0474794e909101dcb2b0c7c809cfbe2bd665..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_62.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_63.const b/unet/.cache/NhwcConv_0-conv_inConv_63.const deleted file mode 100644 index 4c464c45d18e01480ccdf9aa999589f76e428565..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_63.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:873d1b8eb5865b827a1ccee1f74cad27adef21d63b8204d861c24949ee96a0d7 -size 117760 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_64.const b/unet/.cache/NhwcConv_0-conv_inConv_64.const deleted file mode 100644 index 6d115947bae641a1dd5ed6cd4d1137593a1516ac..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_64.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_65.const b/unet/.cache/NhwcConv_0-conv_inConv_65.const deleted file mode 100644 index 4281e0e5a574bd22e0e53c03d82ec866914aeb5a..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_65.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_66.const b/unet/.cache/NhwcConv_0-conv_inConv_66.const deleted file mode 100644 index a87b75c5e8064de0e5e47d78370a146f075025b5..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_66.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9f9cb51b78e28e5bc94f373fded2e74355f13163e83b59b8e00d3a2c68957d80 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_67.const b/unet/.cache/NhwcConv_0-conv_inConv_67.const deleted file mode 100644 index 545ef0f9e5eb597f5b4dc131461e93b7ae789a77..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_67.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:e412bf9366ccc834bcfe9325d86b6eae3f8e903878a03111c19f53a5099dc784 -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_68.const b/unet/.cache/NhwcConv_0-conv_inConv_68.const deleted file mode 100644 index aa700116e8af71bc88697ad3dd271b805f054926..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_68.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9d8f24e5fd90c73982d57ad4ed0c436a09f99d87035088ee9226d8c50369b67c -size 471040 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_69.const b/unet/.cache/NhwcConv_0-conv_inConv_69.const deleted file mode 100644 index a9e31859ee03115f5dee493bae0f7cb0db14308c..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_69.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e532c487302ac8d7fea4147185ea5ee924a66bdef55edfa5057a79d785884b67 -size 125440 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_7.const b/unet/.cache/NhwcConv_0-conv_inConv_7.const deleted file mode 100644 index f70003c68586ab9f6dd094b97b8bde825c6282bd..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_7.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5b659ae95cd22761b049d947e6821a12f2d0ca2103440776525f63506a77dc42 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_70.const b/unet/.cache/NhwcConv_0-conv_inConv_70.const deleted file mode 100644 index fb8ff262a8a237dd87583cb2b501de7fb3f9d83b..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_70.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5aebd18ad661265b3e5408c9112e0a295b87af0f8a260bca21fb64000389f332 -size 1062400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_71.const b/unet/.cache/NhwcConv_0-conv_inConv_71.const deleted file mode 100644 index 
cc772948649fe1c2def3ecec3fb660be2a16c40e..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_71.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_72.const b/unet/.cache/NhwcConv_0-conv_inConv_72.const deleted file mode 100644 index 1f36d557869ec0bcc2e8be127197bd91faf4ffc7..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_72.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9a2752ee2641aaa14a0ab33b408145fc787ad2e6d602f183c4eab71acbf4e488 -size 934400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_73.const b/unet/.cache/NhwcConv_0-conv_inConv_73.const deleted file mode 100644 index 2cc14771ae77d9111a76c015f9699312c750b8e4..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_73.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5c7b20fcf5e2c9dbbbd7e0ac4f9c2662920ee6d562743c7c0e9c202c42549b98 -size 2155520 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_74.const b/unet/.cache/NhwcConv_0-conv_inConv_74.const deleted file mode 100644 index f1e66a7937d0a6aaea5113ae40d0b9cf5a87a7ae..0000000000000000000000000000000000000000 Binary files a/unet/.cache/NhwcConv_0-conv_inConv_74.const and /dev/null differ diff --git a/unet/.cache/NhwcConv_0-conv_inConv_75.const b/unet/.cache/NhwcConv_0-conv_inConv_75.const deleted file mode 100644 index a5a802f1a5841f56f36081a5b7bc1f55f06ac924..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_75.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:994ac55ce51e678683b7f2d0ceb767a5928f4338a4ae598923919088f84ff621 -size 934400 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_76.const b/unet/.cache/NhwcConv_0-conv_inConv_76.const deleted file mode 100644 index 2695cfa9d198484333eb29dfba7e97bcf14139d9..0000000000000000000000000000000000000000 --- 
a/unet/.cache/NhwcConv_0-conv_inConv_76.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4146eb1b8ce67a742a55bd34e3f3b06626f18c8fdb5812a256db2b45cea74e3b -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_77.const b/unet/.cache/NhwcConv_0-conv_inConv_77.const deleted file mode 100644 index fff381dfec5cc9be2dab4f2326de966e04adbb47..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_77.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:63661b0e685fbb4b2ef2ceba92e850f750e486ac7aee39c48b884de37d7c276f -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_78.const b/unet/.cache/NhwcConv_0-conv_inConv_78.const deleted file mode 100644 index 3c2affbbe3da49ce5c3fa35e599b2960096aecab..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_78.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ee8a1ef7c5e1b7c8c7112bc2350af7ec1403079797acfe90dcb078b07f305aeb -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_79.const b/unet/.cache/NhwcConv_0-conv_inConv_79.const deleted file mode 100644 index d856b8a3884d0d8b4a3ce736e1319aef82ac5b5a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_79.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b5557b3f3c9b96644672fa1ee0c57ceed6a9c8df36348099ceafac6912ac5f60 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_8.const b/unet/.cache/NhwcConv_0-conv_inConv_8.const deleted file mode 100644 index 8cd4301ab00305cd1ec1e35e0cec32b046026ef6..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_8.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:61e9bdc6a3932ee60be0794b45ebdd216588b7d7428ed93fc18c363de3704909 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_80.const 
b/unet/.cache/NhwcConv_0-conv_inConv_80.const deleted file mode 100644 index c504773f0f5a8a070a1e26d4e9bb313b66318ca0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_80.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d15485edcb26c0d8816609865e3ca0030be934bf7a74a5804b7b2e49b797ed2b -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_81.const b/unet/.cache/NhwcConv_0-conv_inConv_81.const deleted file mode 100644 index 9c9fec9ed310115e40108dbe409de77ffaa29474..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_81.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:7f5c0a4d15bf1c1af3e88451f0b083cfd3f2daf8033961b20723965d3e261eb9 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_82.const b/unet/.cache/NhwcConv_0-conv_inConv_82.const deleted file mode 100644 index 1306f2e97259430bf3834de7a1b2aedb28aea791..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_82.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:131d634459b640242f49443e7068dcae3cbfd512edd4b8de3ce6ba8c25713581 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_83.const b/unet/.cache/NhwcConv_0-conv_inConv_83.const deleted file mode 100644 index fbbdc7004a4ee5ec085025974133dba3d89dbf99..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_83.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2a688b9f29c21e57c8e7f0c5cc1b24093dcb89899f8494c2491f32a26db7140c -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_84.const b/unet/.cache/NhwcConv_0-conv_inConv_84.const deleted file mode 100644 index 72126f1d08a411d0f5fd4ae68961984c73e9d78f..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_84.const +++ /dev/null @@ -1,3 +0,0 @@ -version 
https://git-lfs.github.com/spec/v1 -oid sha256:e399808f2408200f07176c756c53c76c7941b1e57c2f0a7ec1b1e089ea035d1b -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_85.const b/unet/.cache/NhwcConv_0-conv_inConv_85.const deleted file mode 100644 index 3c0b31b3088497b907c5471e65dd5e89ae103e70..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_85.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:078bd6d5826c0e2c5be187c4b69bd5acbc9ac3962a9074d32d1fac046e271487 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_86.const b/unet/.cache/NhwcConv_0-conv_inConv_86.const deleted file mode 100644 index 8653adf228260bfa9e2ea86a3d7994641eab0c45..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_86.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:4b5e4f635b867ada41356def4111c943167d4dd6eb54e8a0bbde2796e6a8e918 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_87.const b/unet/.cache/NhwcConv_0-conv_inConv_87.const deleted file mode 100644 index e2afa5869cfad2580d7ec17078ce821342b35aac..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_87.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:f446ab62a954467234b2b992896bbacc73296115fbe726ced969ea2043294d75 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_88.const b/unet/.cache/NhwcConv_0-conv_inConv_88.const deleted file mode 100644 index 0d3e251c7e46a4fcb03c4d7668ec355e1607d9d0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_88.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c23ad2538eb607c1fafd1c89bfcda0ad72bb524c58455c296e3828d407823d2c -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_89.const b/unet/.cache/NhwcConv_0-conv_inConv_89.const deleted file mode 100644 index 
efecd44b0be53a2f790a7b2a123b39c1e387d0c3..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_89.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5e25c1fbc4f5b0c1572ed493670ea81b80b61566b2e4e0055928ffd568a83c09 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_9.const b/unet/.cache/NhwcConv_0-conv_inConv_9.const deleted file mode 100644 index 57f55acdc8b1207e80e1f9ae0220929c45e9fe79..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_9.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cbde8cd519c432872eb57fb1fa024b780f46f74c3d3c81533960ee0a67347279 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_90.const b/unet/.cache/NhwcConv_0-conv_inConv_90.const deleted file mode 100644 index 658ee4817d88c1ecf974e695d03726260800e56a..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_90.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:54c32b51d26135f2cc4318b4cae0619b1ff38bdd379c365d7dd7badf79e98146 -size 1121280 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_91.const b/unet/.cache/NhwcConv_0-conv_inConv_91.const deleted file mode 100644 index 2350a5683992cb6556b7f5c3150c427f52955bde..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_91.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:995884c073b37f77778761d9ee73763ac85b656135062a81c58a616f09b69764 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_92.const b/unet/.cache/NhwcConv_0-conv_inConv_92.const deleted file mode 100644 index 49522dcec1f27e7a1dd7e0993f78b7686e7edeb0..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_92.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:efc5c4c8e8c41d4d37a89fc7a5231ae1633a11e94e59239a1e49d1a5e164dd29 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_93.const b/unet/.cache/NhwcConv_0-conv_inConv_93.const deleted file mode 100644 index 68830b1d11c30c6c879004ed69b139433479e791..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_93.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:24b9694ff10e150d35e531beed84b5161b8beb0212b59c7ea7ac7ab346022946 -size 1868800 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_94.const b/unet/.cache/NhwcConv_0-conv_inConv_94.const deleted file mode 100644 index 7479c0448fbd6f8e90d1a7448c5492a0edfd2ab9..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_94.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:2f375bd438bbdf8785539ab73331ea5b9d5ba720dc53b222f3bbb0b697ebd299 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_95.const b/unet/.cache/NhwcConv_0-conv_inConv_95.const deleted file mode 100644 index 076509d6d647e13fc195270aed5cfe38742f1a10..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_95.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:548ab2dd5d218d24da2e10a77a04c3a38b98294e781cde1d0fb9c29d79401978 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_96.const b/unet/.cache/NhwcConv_0-conv_inConv_96.const deleted file mode 100644 index d5c2c24bdd29828855d42e1984d4b15a783a62a2..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_96.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:24439d5ebdb3c26dba4bcf53bc4846d448764a838abad08c4bf21d6eee772a4b -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_97.const b/unet/.cache/NhwcConv_0-conv_inConv_97.const deleted file mode 100644 index 
cf0a5da59d410041a94ae4c60ed9086164736001..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_97.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c0e90c480c5c8b804e9bbd1f96cd17b939a9e4b8d4b9b2025e22989908e2d4e3 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_98.const b/unet/.cache/NhwcConv_0-conv_inConv_98.const deleted file mode 100644 index 43e12f0ec2da204d05a0856662b649a72f86f0cb..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_98.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:086a9b39fbb93fb7a29d14940a729cc61a089e628f7cc39b6da2de3723812682 -size 563200 diff --git a/unet/.cache/NhwcConv_0-conv_inConv_99.const b/unet/.cache/NhwcConv_0-conv_inConv_99.const deleted file mode 100644 index 0f9d3da0cf07459c145b60f1be95716f131dfb3f..0000000000000000000000000000000000000000 --- a/unet/.cache/NhwcConv_0-conv_inConv_99.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5a5bdd1d8f3d3ec701356ce9c51adf94f115bcb4145635f5f983496dc33a82f5 -size 563200 diff --git a/unet/.cache/ops-config.json b/unet/.cache/ops-config.json deleted file mode 100644 index 1eab74d48442f43ebf32c5693bb50defff724adb..0000000000000000000000000000000000000000 --- a/unet/.cache/ops-config.json +++ /dev/null @@ -1,558 +0,0 @@ -{ - "xclbin": "stx_SD_unet_fastpm_2x4x4", - "overlay_json": "", - "overlay": "2x4x4", - "comment": "S: Sign", - "backend_target": "DD", - "model_type": "SD15_UNET", - "op_types": [ - { - "op_type": "GemmTrans", - "attrs": [ - { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - 
] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - } - }, - { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - } - }, - { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - } - }, - { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - } - }, - { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - } - }, - { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - } - }, - { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - } - } - ], - "inputs": [ - [ - [ - 2, - 4096, - 320 - ], - [ - 320, - 320 - ], - [ - 320 - ] - ], - [ - 
[ - 2, - 1024, - 640 - ], - [ - 640, - 640 - ], - [ - 640 - ] - ], - [ - [ - 2, - 256, - 1280 - ], - [ - 1280, - 1280 - ], - [ - 1280 - ] - ], - [ - [ - 2, - 64, - 1280 - ], - [ - 1280, - 1280 - ], - [ - 1280 - ] - ], - [ - [ - 2, - 4096, - 320 - ], - [ - 320, - 320 - ], - [ - 320 - ] - ], - [ - [ - 2, - 1024, - 640 - ], - [ - 640, - 640 - ], - [ - 640 - ] - ], - [ - [ - 2, - 256, - 1280 - ], - [ - 1280, - 1280 - ], - [ - 1280 - ] - ] - ], - "outputs": [ - [ - 2, - 8, - 4096, - 40 - ], - [ - 2, - 8, - 1024, - 80 - ], - [ - 2, - 8, - 256, - 160 - ], - [ - 2, - 8, - 64, - 160 - ], - [ - 2, - 8, - 4096, - 40 - ], - [ - 2, - 8, - 1024, - 80 - ], - [ - 2, - 8, - 256, - 160 - ] - ] - } - ] -} \ No newline at end of file diff --git a/unet/config.json b/unet/config.json new file mode 100644 index 0000000000000000000000000000000000000000..1a02ee8abc93e840ffbcb2d68b66ccbcb74b3ab3 --- /dev/null +++ b/unet/config.json @@ -0,0 +1,36 @@ +{ + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.6.0", + "act_fn": "silu", + "attention_head_dim": 8, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_scale_factor": 1, + "norm_eps": 1e-05, + "norm_num_groups": 32, + "out_channels": 4, + "sample_size": 64, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ] +} diff --git a/unet/.cache/NhwcConv_0-conv_inConv_meta.json b/unet/dd/cache/NhwcConv_0-conv_inConv_meta.json similarity index 92% rename from unet/.cache/NhwcConv_0-conv_inConv_meta.json rename to unet/dd/cache/NhwcConv_0-conv_inConv_meta.json index db9af699fe4b6a6e9a529de06b90633be5754f89..49c0b441d891c7fec5e40847a55eb0fd416102c6 100644 --- 
a/unet/.cache/NhwcConv_0-conv_inConv_meta.json +++ b/unet/dd/cache/NhwcConv_0-conv_inConv_meta.json @@ -1,63223 +1,63206 @@ -{ - "dd_meta_major_version": 1, - "dd_meta_minor_version": 4, - "state_table_updates": [], - "op_list": [ - { - "name": "NhwcConv_0-/conv_in/Conv", - "type": "SDConv", - "in_args": [ - "Transpose_44_out-sample.out0_1_0" - ], - "const_args": [ - "NhwcConv_0_weight_NHWC" - ], - "out_args": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "4" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "4" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_SDCastBf2Bfp_7_0", - "type": "SDCastBf2Bfp", - "in_args": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0" - ], - "const_args": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.wts7_0" - ], - "out_args": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] 
- }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_0", - "type": "SDGroupNorm_bfp", - "in_args": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0" - ], - "const_args": [ - "GroupNorm_0_wts_6_0_0" - ], - "out_args": [ - "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5660" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - 
"bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5661" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5690" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" 
- ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5691" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5720" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5721" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5750" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5751" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5780" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5781" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5810" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5811" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5848" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": 
{ - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5849" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/time_embedding/linear_1/Gemm", - "type": "SDGemm", - "in_args": [ - "/time_proj/Concat_1_output_0.out2_3_0" - ], - "const_args": [ - "time_embedding.linear_1.weight_11_1_0" - ], - "out_args": [ - "/time_embedding/linear_1/Gemm_output_0.out2_3_0" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - 
"bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid", - "type": "SDSilu", - "in_args": [ - "/time_embedding/linear_1/Gemm_output_0.out2_3_0" - ], - "const_args": [ - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid.weights14_0" - ], - "out_args": [ - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "128" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/time_embedding/linear_2/Gemm", - "type": "SDGemm", - "in_args": [ - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0" - ], - "const_args": [ - "time_embedding.linear_2.weight_11_1_1" - ], - "out_args": [ - "/time_embedding/linear_2/Gemm_output_0.out2_3_1" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid", - "type": "SDSilu", - "in_args": [ - "/time_embedding/linear_2/Gemm_output_0.out2_3_1" - ], - "const_args": [ - 
"/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid.weights14_1" - ], - "out_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "128" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.0.resnets.0.time_emb_proj.weight_11_1_2" - ], - "out_args": [ - "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_1-/down_blocks.0/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0" - ], - "const_args": [ - "NhwcConv_1_weight_NHWC" - ], - "out_args": [ - "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - 
"value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1", - "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_1", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0" - ], - "const_args": [ - "GroupNorm_1_wts_6_0_1" - ], - "out_args": [ - "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - 
"type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_2-/down_blocks.0/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1" - ], - "const_args": [ - "NhwcConv_2_weight_NHWC" - ], - "out_args": [ - "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] 
- }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0", - "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_2", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1" - ], - "const_args": [ - "GroupNorm_2_wts_6_2_0" - ], - "out_args": [ - "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_3-/down_blocks.0/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2" - ], - "const_args": [ - "NhwcConv_3_weight_NHWC" - ], - "out_args": [ - "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3" - ], - "const_args": [ - "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight", - "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - 
"value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" - ], - "const_args": [ - "Attention_0_qkv_weight_key" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - 
"/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" - ], - "const_args": [ - "Attention_0_qkv_weight_query" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" - ], - "const_args": [ - "Attention_0_qkv_weight_value" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - 
}, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_0", - "type": "SDMHA_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_1_0" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "4096" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_1_0" - ], - "const_args": [ - "onnx::MatMul_5658_11_0_0" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - 
"type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75", - "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2" - ], - "const_args": [ - "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight", - "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": 
"int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1" - ], - "const_args": [ - "onnx::MatMul_5659" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_0", - "type": "SDCastBfp2Bf", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0" - ], - "const_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0.wts9_0" - ], - "out_args": [ - 
"/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_0", - "type": "SDFlatMHA", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_SDCastBf2Bfp_9_76", - "type": "SDCastBf2Bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1" - ], - "const_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.wts9_76" - ], - "out_args": [ - 
"/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76" - ], - "const_args": [ - "onnx::MatMul_5669_11_0_1" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76", - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" 
- ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3" - ], - "const_args": [ - "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight", - "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_0_0", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2" - ], - "const_args": [ - 
"onnx::MatMul_5670_11_0_2_12_0_0" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_0_1", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2" - ], - "const_args": [ - "onnx::MatMul_5670_11_0_2_12_0_1" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - 
"/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78", - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0" - ], - "const_args": [ - "onnx::MatMul_5671_11_0_3" - ], - "out_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79", - 
"/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_4-/down_blocks.0/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4" - ], - "const_args": [ - "NhwcConv_4_weight_NHWC" - ], - "out_args": [ - "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - 
"value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4", - "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_3", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5" - ], - "const_args": [ - "GroupNorm_3_wts_6_0_2" - ], - "out_args": [ - "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.0.resnets.1.time_emb_proj.weight_11_1_3" - ], - "out_args": [ - "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_5-/down_blocks.0/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3" - ], - "const_args": [ - "NhwcConv_5_weight_NHWC" - ], - "out_args": [ - "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", 
- "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5", - "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_4", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6" - ], - "const_args": [ - "GroupNorm_4_wts_6_0_3" - ], - "out_args": [ - "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - 
"beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_6-/down_blocks.0/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4" - ], - "const_args": [ - "NhwcConv_6_weight_NHWC" - ], - "out_args": [ - "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5", - "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", 
- "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_5", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7" - ], - "const_args": [ - "GroupNorm_5_wts_6_2_1" - ], - "out_args": [ - "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_7-/down_blocks.0/attentions.1/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5" - ], - "const_args": [ - "NhwcConv_7_weight_NHWC" - ], - "out_args": [ - "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7" - ], - "attrs": { - 
"auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7" - ], - "const_args": [ - "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight", - "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - 
}, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" - ], - "const_args": [ - "Attention_1_qkv_weight_key" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" - ], - "const_args": [ - "Attention_1_qkv_weight_query" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - 
}, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" - ], - "const_args": [ - "Attention_1_qkv_weight_value" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_1", - "type": "SDMHA_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81", - 
"/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_1_1" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "4096" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_1_1" - ], - "const_args": [ - "onnx::MatMul_5688_11_0_4" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - 
"/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83", - "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8" - ], - "const_args": [ - "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight", - "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": 
[ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4" - ], - "const_args": [ - "onnx::MatMul_5689" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_3", - "type": "SDCastBfp2Bf", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3" - ], - "const_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3.wts9_3" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - 
] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_1", - "type": "SDFlatMHA", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_SDCastBf2Bfp_9_84", - "type": "SDCastBf2Bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3" - ], - "const_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.wts9_84" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - 
"type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84" - ], - "const_args": [ - "onnx::MatMul_5699_11_0_5" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84", - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" 
- ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9" - ], - "const_args": [ - "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight", - "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_1_0", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5" - ], - "const_args": [ - "onnx::MatMul_5700_11_0_6_12_1_0" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": 
"int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_1_1", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5" - ], - "const_args": [ - "onnx::MatMul_5700_11_0_6_12_1_1" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86", - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "c_shape": { - 
"type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1" - ], - "const_args": [ - "onnx::MatMul_5701_11_0_7" - ], - "out_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87", - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - 
"in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_8-/down_blocks.0/attentions.1/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10" - ], - "const_args": [ - "NhwcConv_8_weight_NHWC" - ], - "out_args": [ - "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.0/attentions.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8", - "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7" - ], - "const_args": [], - "out_args": [ - "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", 
- "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_9-/down_blocks.0/downsamplers.0/conv/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11" - ], - "const_args": [ - "NhwcConv_9_weight_NHWC" - ], - "out_args": [ - "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "2", - "2" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_6", - "type": "SDGroupNorm_bfp", - "in_args": [ - "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" - ], - "const_args": [ - "GroupNorm_6_wts_6_0_4" - ], - "out_args": [ - "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6" - ], - "attrs": { - "epsilon": { - "type": "float", - 
"value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.1.resnets.0.time_emb_proj.weight_11_1_4" - ], - "out_args": [ - "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_10-/down_blocks.1/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6" - ], - "const_args": [ - "NhwcConv_10_weight_NHWC" - ], - 
"out_args": [ - "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11", - "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_7", - "type": "SDGroupNorm_bfp", - "in_args": [ 
- "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12" - ], - "const_args": [ - "GroupNorm_7_wts_6_0_5" - ], - "out_args": [ - "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.1.resnets.1.time_emb_proj.weight_11_1_5" - ], - "out_args": [ - "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - 
"1" - ] - } - } - }, - { - "name": "/down_blocks.2/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.2.resnets.0.time_emb_proj.weight_11_1_6" - ], - "out_args": [ - "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.2.resnets.1.time_emb_proj.weight_11_1_7" - ], - "out_args": [ - "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.3/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - 
"const_args": [ - "down_blocks.3.resnets.0.time_emb_proj.weight_11_1_8" - ], - "out_args": [ - "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.3/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "down_blocks.3.resnets.1.time_emb_proj.weight_11_1_9" - ], - "out_args": [ - "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "mid_block.resnets.0.time_emb_proj.weight_11_1_10" - ], - "out_args": [ - "/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - 
"2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "mid_block.resnets.1.time_emb_proj.weight_11_1_11" - ], - "out_args": [ - "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.0.resnets.0.time_emb_proj.weight_11_1_12" - ], - "out_args": [ - "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - 
"value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.0.resnets.1.time_emb_proj.weight_11_1_13" - ], - "out_args": [ - "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.2/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.0.resnets.2.time_emb_proj.weight_11_1_14" - ], - "out_args": [ - "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - 
"type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5895" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5896" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": 
"int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5925" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5926" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - 
"value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5955" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5956" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - 
"1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.1.resnets.0.time_emb_proj.weight_11_1_15" - ], - "out_args": [ - "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.1.resnets.1.time_emb_proj.weight_11_1_16" - ], - "out_args": [ - "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.2/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - 
"up_blocks.1.resnets.2.time_emb_proj.weight_11_1_17" - ], - "out_args": [ - "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5986" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_5987" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21" - ], - 
"attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6016" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6017" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23" - ], - "attrs": { - 
"input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6046" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6047" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25" - ], - "attrs": { - "input_shape": { 
- "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.2.resnets.0.time_emb_proj.weight_11_1_18" - ], - "out_args": [ - "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.2.resnets.1.time_emb_proj.weight_11_1_19" - ], - "out_args": [ - "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", 
- "value": [ - "2", - "1", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.2/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.2.resnets.2.time_emb_proj.weight_11_1_20" - ], - "out_args": [ - "/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6077" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - 
"type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6078" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6107" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - 
"value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6108" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6137" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - 
"bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", - "type": "SDGemm", - "in_args": [ - "encoder_hidden_states.out2_6_0" - ], - "const_args": [ - "onnx::MatMul_6138" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "77", - "768" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "77", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "768", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.0/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.3.resnets.0.time_emb_proj.weight_11_1_21" - ], - "out_args": [ - "/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": 
[ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.1/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.3.resnets.1.time_emb_proj.weight_11_1_22" - ], - "out_args": [ - "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.2/time_emb_proj/Gemm", - "type": "SDGemm", - "in_args": [ - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" - ], - "const_args": [ - "up_blocks.3.resnets.2.time_emb_proj.weight_11_1_23" - ], - "out_args": [ - "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": 
"NhwcConv_11-/down_blocks.1/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7" - ], - "const_args": [ - "NhwcConv_11_weight_NHWC" - ], - "out_args": [ - "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_12-/down_blocks.1/resnets.0/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" - ], - "const_args": [ - "NhwcConv_12_weight_NHWC" - ], - "out_args": [ - "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ 
- "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10", - "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_8", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13" - ], - "const_args": [ - "GroupNorm_8_wts_6_2_2" - ], - "out_args": [ - "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": 
"int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_13-/down_blocks.1/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8" - ], - "const_args": [ - "NhwcConv_13_weight_NHWC" - ], - "out_args": [ - "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - "type": 
"SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13" - ], - "const_args": [ - "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", - "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" - ], - "const_args": [ - "Attention_2_qkv_weight_key" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", 
- "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" - ], - "const_args": [ - "Attention_2_qkv_weight_query" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" - ], - "const_args": [ - "Attention_2_qkv_weight_value" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - 
"type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_2", - "type": "SDMHA_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_1_2" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "1024" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_1_2" - ], - "const_args": [ - 
"onnx::MatMul_5718_11_0_8" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91", - "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14" - ], - "const_args": [ - "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", - 
"down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7" - ], - "const_args": [ - "onnx::MatMul_5719" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ 
- "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_6", - "type": "SDCastBfp2Bf", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6" - ], - "const_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6.wts9_6" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_2", - "type": "SDFlatMHA", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, 
- { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_SDCastBf2Bfp_9_92", - "type": "SDCastBf2Bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5" - ], - "const_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.wts9_92" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92" - ], - "const_args": [ - "onnx::MatMul_5729_11_0_9" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - 
"/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92", - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15" - ], - "const_args": [ - "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", - "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_2_0", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8" - ], - "const_args": [ - "onnx::MatMul_5730_11_0_10_12_2_0" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_2_1", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8" - ], - "const_args": [ - "onnx::MatMul_5730_11_0_10_12_2_1" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": 
"str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94", - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2" - ], - "const_args": [ - "onnx::MatMul_5731_11_0_11" - ], - "out_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "2560", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - 
"out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95", - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_14-/down_blocks.1/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16" - ], - "const_args": [ - "NhwcConv_14_weight_NHWC" - ], - "out_args": [ - "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - 
"type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14", - "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_9", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17" - ], - "const_args": [ - "GroupNorm_9_wts_6_0_6" - ], - "out_args": [ - "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - 
"32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_15-/down_blocks.1/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9" - ], - "const_args": [ - "NhwcConv_15_weight_NHWC" - ], - "out_args": [ - "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15", - "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3" - ], - 
"const_args": [], - "out_args": [ - "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_10", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18" - ], - "const_args": [ - "GroupNorm_10_wts_6_0_7" - ], - "out_args": [ - "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_16-/down_blocks.1/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - 
"GroupNorm_10.out7_10.out6_0_7_bfp.out7_10" - ], - "const_args": [ - "NhwcConv_16_weight_NHWC" - ], - "out_args": [ - "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17", - "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": 
"int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_11", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19" - ], - "const_args": [ - "GroupNorm_11_wts_6_2_3" - ], - "out_args": [ - "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_17-/down_blocks.1/attentions.1/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11" - ], - "const_args": [ - "NhwcConv_17_weight_NHWC" - ], - "out_args": [ - "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": 
"int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17" - ], - "const_args": [ - "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", - "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" - ], - "const_args": [ - 
"Attention_3_qkv_weight_key" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" - ], - "const_args": [ - "Attention_3_qkv_weight_query" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } 
- }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" - ], - "const_args": [ - "Attention_3_qkv_weight_value" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_3", - "type": "SDMHA_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_1_3" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "1024" - ] - }, - "op_version": { - "type": "str", - 
"value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_1_3" - ], - "const_args": [ - "onnx::MatMul_5748_11_0_12" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99", - "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - 
"type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20" - ], - "const_args": [ - "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", - "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10" - ], - "const_args": [ - "onnx::MatMul_5749" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - 
"1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_9", - "type": "SDCastBfp2Bf", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9" - ], - "const_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9.wts9_9" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_3", - "type": "SDFlatMHA", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7" - ], - "attrs": { 
- "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_SDCastBf2Bfp_9_100", - "type": "SDCastBf2Bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7" - ], - "const_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.wts9_100" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100" - ], - "const_args": [ - "onnx::MatMul_5759_11_0_13" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] 
- }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100", - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21" - ], - "const_args": [ - "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", - "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11" - ], - "attrs": { - "axis": { - 
"type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_3_0", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11" - ], - "const_args": [ - "onnx::MatMul_5760_11_0_14_12_3_0" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_3_1", - "type": "SDGemm_bfp", - "in_args": [ - 
"/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11" - ], - "const_args": [ - "onnx::MatMul_5760_11_0_14_12_3_1" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102", - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - 
"/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3" - ], - "const_args": [ - "onnx::MatMul_5761_11_0_15" - ], - "out_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "2560", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103", - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_18-/down_blocks.1/attentions.1/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22" - ], - 
"const_args": [ - "NhwcConv_18_weight_NHWC" - ], - "out_args": [ - "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.1/attentions.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18", - "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19" - ], - "const_args": [], - "out_args": [ - "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - 
}, - { - "name": "NhwcConv_19-/down_blocks.1/downsamplers.0/conv/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23" - ], - "const_args": [ - "NhwcConv_19_weight_NHWC" - ], - "out_args": [ - "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "2", - "2" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_12", - "type": "SDGroupNorm_bfp", - "in_args": [ - "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" - ], - "const_args": [ - "GroupNorm_12_wts_6_0_8" - ], - "out_args": [ - "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - 
"16", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_20-/down_blocks.2/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12" - ], - "const_args": [ - "NhwcConv_20_weight_NHWC" - ], - "out_args": [ - "NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21", - "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4" - ], - 
"const_args": [], - "out_args": [ - "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_13", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24" - ], - "const_args": [ - "GroupNorm_13_wts_6_0_9" - ], - "out_args": [ - "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_21-/down_blocks.2/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - 
"GroupNorm_13.out7_13.out6_0_9_bfp.out7_13" - ], - "const_args": [ - "NhwcConv_21_weight_NHWC" - ], - "out_args": [ - "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_22-/down_blocks.2/resnets.0/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" - ], - "const_args": [ - "NhwcConv_22_weight_NHWC" - ], - "out_args": [ - "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - 
"16", - "16", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20", - "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_14", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25" - ], - "const_args": [ - "GroupNorm_14_wts_6_2_4" - ], - "out_args": [ - "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - 
"value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_23-/down_blocks.2/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14" - ], - "const_args": [ - "NhwcConv_23_weight_NHWC" - ], - "out_args": [ - "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - 
"/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23" - ], - "const_args": [ - "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", - "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" - ], - "const_args": [ - "Attention_4_qkv_weight_key" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - 
}, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" - ], - "const_args": [ - "Attention_4_qkv_weight_query" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" - ], - "const_args": [ - "Attention_4_qkv_weight_value" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - 
"value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_4", - "type": "SDMHA_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_1_4" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "256" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_1_4" - ], - "const_args": [ - 
"onnx::MatMul_5778_11_0_16" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107", - "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26" - ], - "const_args": [ - "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", 
- "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13" - ], - "const_args": [ - "onnx::MatMul_5779" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - 
"value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_12", - "type": "SDCastBfp2Bf", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12" - ], - "const_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12.wts9_12" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_4", - "type": "SDFlatMHA", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - 
] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_SDCastBf2Bfp_9_108", - "type": "SDCastBf2Bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9" - ], - "const_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.wts9_108" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108" - ], - "const_args": [ - "onnx::MatMul_5789_11_0_17" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - 
"in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108", - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27" - ], - "const_args": [ - "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", - "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] 
- }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_4_0", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14" - ], - "const_args": [ - "onnx::MatMul_5790_11_0_18_12_4_0" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_4_1", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14" - ], - "const_args": [ - "onnx::MatMul_5790_11_0_18_12_4_1" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - 
"in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110", - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4" - ], - "const_args": [ - "onnx::MatMul_5791_11_0_19" - ], - "out_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "5120", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - 
"bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111", - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_24-/down_blocks.2/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28" - ], - "const_args": [ - "NhwcConv_24_weight_NHWC" - ], - "out_args": [ - "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - 
"output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24", - "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_15", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29" - ], - "const_args": [ - "GroupNorm_15_wts_6_0_10" - ], - "out_args": [ - "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": 
"int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_25-/down_blocks.2/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15" - ], - "const_args": [ - "NhwcConv_25_weight_NHWC" - ], - "out_args": [ - "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25", - 
"/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_16", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30" - ], - "const_args": [ - "GroupNorm_16_wts_6_0_11" - ], - "out_args": [ - "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_26-/down_blocks.2/resnets.1/conv2/Conv", - 
"type": "SDConv_bfp", - "in_args": [ - "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16" - ], - "const_args": [ - "NhwcConv_26_weight_NHWC" - ], - "out_args": [ - "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29", - "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_17", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31" - ], - "const_args": [ - "GroupNorm_17_wts_6_2_5" - ], - "out_args": [ - "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_27-/down_blocks.2/attentions.1/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17" - ], - "const_args": [ - "NhwcConv_27_weight_NHWC" - ], - "out_args": [ - "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": 
[ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27" - ], - "const_args": [ - "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", - "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - 
"/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" - ], - "const_args": [ - "Attention_5_qkv_weight_key" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" - ], - "const_args": [ - "Attention_5_qkv_weight_query" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - 
}, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" - ], - "const_args": [ - "Attention_5_qkv_weight_value" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_5", - "type": "SDMHA_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_1_5" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": 
[ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "256" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_1_5" - ], - "const_args": [ - "onnx::MatMul_5808_11_0_20" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115", - "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - 
"value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32" - ], - "const_args": [ - "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", - "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16" - ], - "const_args": [ - "onnx::MatMul_5809" - ], - "out_args": [ - 
"/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_15", - "type": "SDCastBfp2Bf", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15" - ], - "const_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15.wts9_15" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_5", - "type": "SDFlatMHA", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10", - 
"/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_SDCastBf2Bfp_9_116", - "type": "SDCastBf2Bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11" - ], - "const_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.wts9_116" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116" - ], - "const_args": [ - 
"onnx::MatMul_5819_11_0_21" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116", - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33" - ], - "const_args": [ - 
"down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", - "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_5_0", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17" - ], - "const_args": [ - "onnx::MatMul_5820_11_0_22_12_5_0" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] 
- }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_5_1", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17" - ], - "const_args": [ - "onnx::MatMul_5820_11_0_22_12_5_1" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118", - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": 
[ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5" - ], - "const_args": [ - "onnx::MatMul_5821_11_0_23" - ], - "out_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "5120", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119", - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": 
"NhwcConv_28-/down_blocks.2/attentions.1/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34" - ], - "const_args": [ - "NhwcConv_28_weight_NHWC" - ], - "out_args": [ - "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.2/attentions.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28", - "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31" - ], - "const_args": [], - "out_args": [ - "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - 
"value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_29-/down_blocks.2/downsamplers.0/conv/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35" - ], - "const_args": [ - "NhwcConv_29_weight_NHWC" - ], - "out_args": [ - "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "2", - "2" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_18", - "type": "SDGroupNorm_bfp", - "in_args": [ - "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29" - ], - "const_args": [ - "GroupNorm_18_wts_6_0_12" - ], - "out_args": [ - "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": 
"int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_30-/down_blocks.3/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18" - ], - "const_args": [ - "NhwcConv_30_weight_NHWC" - ], - "out_args": [ - "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.3/resnets.0/Add", - 
"type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30", - "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6" - ], - "const_args": [], - "out_args": [ - "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_19", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36" - ], - "const_args": [ - "GroupNorm_19_wts_6_0_13" - ], - "out_args": [ - "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - 
"type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_31-/down_blocks.3/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19" - ], - "const_args": [ - "NhwcConv_31_weight_NHWC" - ], - "out_args": [ - "NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.3/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29", - "NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31" - ], - "const_args": [], - "out_args": [ - "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - 
"in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_20", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37" - ], - "const_args": [ - "GroupNorm_20_wts_6_0_14" - ], - "out_args": [ - "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_32-/down_blocks.3/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20" - ], - "const_args": [ - "NhwcConv_32_weight_NHWC" - ], - "out_args": [ - "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - 
"value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.3/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32", - "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7" - ], - "const_args": [], - "out_args": [ - "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_21", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38" - ], - "const_args": [ - "GroupNorm_21_wts_6_0_15" - ], - "out_args": [ - "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - 
"channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_33-/down_blocks.3/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21" - ], - "const_args": [ - "NhwcConv_33_weight_NHWC" - ], - "out_args": [ - "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": 
"int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/down_blocks.3/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37", - "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33" - ], - "const_args": [], - "out_args": [ - "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_22", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39" - ], - "const_args": [ - "GroupNorm_22_wts_6_0_16" - ], - "out_args": [ - "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - 
] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_34-/mid_block/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22" - ], - "const_args": [ - "NhwcConv_34_weight_NHWC" - ], - "out_args": [ - "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34", - "/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8" - ], - "const_args": [], - "out_args": [ - "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - 
"type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_23", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40" - ], - "const_args": [ - "GroupNorm_23_wts_6_0_17" - ], - "out_args": [ - "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_35-/mid_block/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23" - ], - "const_args": [ - "NhwcConv_35_weight_NHWC" - ], - "out_args": [ - "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - 
"kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39", - "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35" - ], - "const_args": [], - "out_args": [ - "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_24", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41" - ], - "const_args": [ - "GroupNorm_24_wts_6_2_6" - ], - "out_args": [ - "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - 
"type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_36-/mid_block/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24" - ], - "const_args": [ - "NhwcConv_36_weight_NHWC" - ], - "out_args": [ - "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - 
"value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36" - ], - "const_args": [ - "mid_block.attentions.0.transformer_blocks.0.norm1.weight", - "mid_block.attentions.0.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" - ], - "const_args": [ - "Attention_6_qkv_weight_key" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - 
"1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" - ], - "const_args": [ - "Attention_6_qkv_weight_query" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" - ], - "const_args": [ - "Attention_6_qkv_weight_value" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122" - ], - "attrs": { - "input_shape": 
{ - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key_SDCastBfp2Bf_9_121", - "type": "SDCastBfp2Bf", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121" - ], - "const_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121.wts9_121" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query_SDCastBfp2Bf_9_120", - "type": "SDCastBfp2Bf", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120" - ], - "const_args": [ - 
"/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120.wts9_120" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value_SDCastBfp2Bf_9_122", - "type": "SDCastBfp2Bf", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122" - ], - "const_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122.wts9_122" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_6", - "type": "SDFlatMHA", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18", - 
"/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "160", - "64" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_SDCastBf2Bfp_9_123", - "type": "SDCastBf2Bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12" - ], - "const_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.wts9_123" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123" - ], - "const_args": [ - "onnx::MatMul_5846_11_0_24" - ], 
- "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123", - "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42" - ], - "const_args": [ - "mid_block.attentions.0.transformer_blocks.0.norm2.weight", - "mid_block.attentions.0.transformer_blocks.0.norm2.bias" - ], - 
"out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19" - ], - "const_args": [ - "onnx::MatMul_5847" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": 
"/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_18", - "type": "SDCastBfp2Bf", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18" - ], - "const_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18.wts9_18" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "64", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_6", - "type": "SDFlatMHA", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "160", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": 
"/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_SDCastBf2Bfp_9_124", - "type": "SDCastBf2Bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13" - ], - "const_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.wts9_124" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124" - ], - "const_args": [ - "onnx::MatMul_5857_11_0_25" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - 
"/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124", - "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43" - ], - "const_args": [ - "mid_block.attentions.0.transformer_blocks.0.norm3.weight", - "mid_block.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": 
[ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_6_0", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20" - ], - "const_args": [ - "onnx::MatMul_5858_11_0_26_12_6_0" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_6_1", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20" - ], - "const_args": [ - "onnx::MatMul_5858_11_0_26_12_6_1" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - 
] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126", - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "5120" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "5120" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "5120" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6" - ], - "const_args": [ - "onnx::MatMul_5859_11_0_27" - ], - "out_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "5120" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "5120", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - 
"value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127", - "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_37-/mid_block/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44" - ], - "const_args": [ - "NhwcConv_37_weight_NHWC" - ], - "out_args": [ - "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - 
"1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37", - "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41" - ], - "const_args": [], - "out_args": [ - "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_25", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45" - ], - "const_args": [ - "GroupNorm_25_wts_6_0_18" - ], - "out_args": [ - "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - 
"beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_38-/mid_block/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25" - ], - "const_args": [ - "NhwcConv_38_weight_NHWC" - ], - "out_args": [ - "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38", - "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9" - ], - "const_args": [], - "out_args": [ - "/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - 
"1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_26", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46" - ], - "const_args": [ - "GroupNorm_26_wts_6_0_19" - ], - "out_args": [ - "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_39-/mid_block/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26" - ], - "const_args": [ - "NhwcConv_39_weight_NHWC" - ], - "out_args": [ - "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39" - ], - "attrs": { - 
"auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/mid_block/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45", - "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39" - ], - "const_args": [], - "out_args": [ - "/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/Concat", - "type": "SDConcat_bfp", - "in_args": [ - "/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47", - "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39" - ], - 
"const_args": [], - "out_args": [ - "/up_blocks.0/Concat.out19_1_bfp.out20_0" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_27", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.0/Concat.out19_1_bfp.out20_0" - ], - "const_args": [ - "GroupNorm_27_wts_6_0_20" - ], - "out_args": [ - "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "5120" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_40-/up_blocks.0/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27" - ], - "const_args": [ - 
"NhwcConv_40_weight_NHWC" - ], - "out_args": [ - "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41", - "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_28", - "type": 
"SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48" - ], - "const_args": [ - "GroupNorm_28_wts_6_0_21" - ], - "out_args": [ - "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_41-/up_blocks.0/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28" - ], - "const_args": [ - "NhwcConv_41_weight_NHWC" - ], - "out_args": [ - "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - 
"output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_42-/up_blocks.0/resnets.0/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.0/Concat.out19_1_bfp.out20_0" - ], - "const_args": [ - "NhwcConv_42_weight_NHWC" - ], - "out_args": [ - "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40", - "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42" - ], - "const_args": [], - "out_args": [ - 
"/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/Concat_1", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49", - "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/Concat_1.out19_2_bfp.out20_1" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_29", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.0/Concat_1.out19_2_bfp.out20_1" - ], - "const_args": [ - "GroupNorm_29_wts_6_0_22" - ], - "out_args": [ - "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - 
"input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "5120" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_43-/up_blocks.0/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29" - ], - "const_args": [ - "NhwcConv_43_weight_NHWC" - ], - "out_args": [ - "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - 
"NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44", - "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_30", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50" - ], - "const_args": [ - "GroupNorm_30_wts_6_0_23" - ], - "out_args": [ - "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } 
- }, - { - "name": "NhwcConv_44-/up_blocks.0/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30" - ], - "const_args": [ - "NhwcConv_44_weight_NHWC" - ], - "out_args": [ - "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_45-/up_blocks.0/resnets.1/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.0/Concat_1.out19_2_bfp.out20_1" - ], - "const_args": [ - "NhwcConv_45_weight_NHWC" - ], - "out_args": [ - "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - 
"input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43", - "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/Concat_2", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51", - "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/Concat_2.out19_3_bfp.out20_2" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - 
"c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_31", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.0/Concat_2.out19_3_bfp.out20_2" - ], - "const_args": [ - "GroupNorm_31_wts_6_0_24" - ], - "out_args": [ - "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "5120" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_46-/up_blocks.0/resnets.2/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31" - ], - "const_args": [ - "NhwcConv_46_weight_NHWC" - ], - "out_args": [ - "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - 
"value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47", - "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_32", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52" - ], - "const_args": [ - "GroupNorm_32_wts_6_0_25" - ], - "out_args": [ - "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - 
"type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_47-/up_blocks.0/resnets.2/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32" - ], - "const_args": [ - "NhwcConv_47_weight_NHWC" - ], - "out_args": [ - "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - 
"float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_48-/up_blocks.0/resnets.2/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.0/Concat_2.out19_3_bfp.out20_2" - ], - "const_args": [ - "NhwcConv_48_weight_NHWC" - ], - "out_args": [ - "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/resnets.2/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46", - "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48" - ], - "const_args": [], - "out_args": [ - "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "is_bias_add": { - 
"type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.0/upsamplers.0/Resize", - "type": "SDResize_bfp", - "in_args": [ - "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53" - ], - "const_args": [ - "/up_blocks.0/upsamplers.0/Resize.weights3_0" - ], - "out_args": [ - "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "8", - "8", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_49-/up_blocks.0/upsamplers.0/conv/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0" - ], - "const_args": [ - "NhwcConv_49_weight_NHWC" - ], - "out_args": [ - "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - 
"1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/Concat", - "type": "SDConcat_bfp", - "in_args": [ - "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49", - "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/Concat.out19_4_bfp.out20_3" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_33", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/Concat.out19_4_bfp.out20_3" - ], - "const_args": [ - "GroupNorm_33_wts_6_0_26" - ], - "out_args": [ - "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "5120" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - 
"beta_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_50-/up_blocks.1/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33" - ], - "const_args": [ - "NhwcConv_50_weight_NHWC" - ], - "out_args": [ - "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51", - "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - 
"16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_34", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54" - ], - "const_args": [ - "GroupNorm_34_wts_6_0_27" - ], - "out_args": [ - "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_51-/up_blocks.1/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34" - ], - "const_args": [ - "NhwcConv_51_weight_NHWC" - ], - "out_args": [ - 
"NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_52-/up_blocks.1/resnets.0/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/Concat.out19_4_bfp.out20_3" - ], - "const_args": [ - "NhwcConv_52_weight_NHWC" - ], - "out_args": [ - "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": 
[ - "1280", - "1", - "1", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50", - "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_35", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55" - ], - "const_args": [ - "GroupNorm_35_wts_6_2_7" - ], - "out_args": [ - "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - 
"value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_53-/up_blocks.1/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35" - ], - "const_args": [ - "NhwcConv_53_weight_NHWC" - ], - "out_args": [ - "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53" - ], - "const_args": [ - "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", - "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias" 
- ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" - ], - "const_args": [ - "Attention_7_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" 
- ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" - ], - "const_args": [ - "Attention_7_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" - ], - "const_args": [ - "Attention_7_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] 
- }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_7", - "type": "SDMHA_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_1_6" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "256" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_1_6" - ], - "const_args": [ - "onnx::MatMul_5893_11_0_28" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - 
"output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131", - "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56" - ], - "const_args": [ - "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", - "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - 
"epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22" - ], - "const_args": [ - "onnx::MatMul_5894" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_21", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21" - 
], - "const_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21.wts9_21" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_7", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_SDCastBf2Bfp_9_132", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15" - ], - "const_args": [ - 
"/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.wts9_132" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132" - ], - "const_args": [ - "onnx::MatMul_5904_11_0_29" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132", - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56" - ], - "const_args": [], - "out_args": [ - 
"/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57" - ], - "const_args": [ - "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", - "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_7_0", - 
"type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23" - ], - "const_args": [ - "onnx::MatMul_5905_11_0_30_12_7_0" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_7_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23" - ], - "const_args": [ - "onnx::MatMul_5905_11_0_30_12_7_1" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": 
"/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134", - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7" - ], - "const_args": [ - "onnx::MatMul_5906_11_0_31" - ], - "out_args": [ - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "5120", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - 
"/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135", - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_54-/up_blocks.1/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58" - ], - "const_args": [ - "NhwcConv_54_weight_NHWC" - ], - "out_args": [ - "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - 
"value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54", - "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/Concat_1", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59", - "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/Concat_1.out19_5_bfp.out20_4" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_36", - "type": "SDGroupNorm_bfp", - "in_args": [ - 
"/up_blocks.1/Concat_1.out19_5_bfp.out20_4" - ], - "const_args": [ - "GroupNorm_36_wts_6_0_28" - ], - "out_args": [ - "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "5120" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_55-/up_blocks.1/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36" - ], - "const_args": [ - "NhwcConv_55_weight_NHWC" - ], - "out_args": [ - "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - 
"2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56", - "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_37", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60" - ], - "const_args": [ - "GroupNorm_37_wts_6_0_29" - ], - "out_args": [ - "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - 
"type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_56-/up_blocks.1/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37" - ], - "const_args": [ - "NhwcConv_56_weight_NHWC" - ], - "out_args": [ - "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_57-/up_blocks.1/resnets.1/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/Concat_1.out19_5_bfp.out20_4" - ], - "const_args": [ - "NhwcConv_57_weight_NHWC" - ], - "out_args": [ - 
"NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "2560" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55", - "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_38", - 
"type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61" - ], - "const_args": [ - "GroupNorm_38_wts_6_2_8" - ], - "out_args": [ - "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_58-/up_blocks.1/attentions.1/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38" - ], - "const_args": [ - "NhwcConv_58_weight_NHWC" - ], - "out_args": [ - "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { 
- "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58" - ], - "const_args": [ - "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", - "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" - ], - "const_args": [ - "Attention_8_qkv_weight_key" - ], - "out_args": [ - 
"/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" - ], - "const_args": [ - "Attention_8_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": 
"/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" - ], - "const_args": [ - "Attention_8_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_8", - "type": "SDMHA_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_1_7" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "256" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - 
"is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_1_7" - ], - "const_args": [ - "onnx::MatMul_5923_11_0_32" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139", - "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, 
- "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62" - ], - "const_args": [ - "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", - "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25" - ], - "const_args": [ - "onnx::MatMul_5924" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": 
"int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_24", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24" - ], - "const_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24.wts9_24" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_8", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, 
- "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_SDCastBf2Bfp_9_140", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17" - ], - "const_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.wts9_140" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140" - ], - "const_args": [ - "onnx::MatMul_5934_11_0_33" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - 
"1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140", - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63" - ], - "const_args": [ - "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", - "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": 
[ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_8_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26" - ], - "const_args": [ - "onnx::MatMul_5935_11_0_34_12_8_0" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_8_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26" - ], - "const_args": [ - 
"onnx::MatMul_5935_11_0_34_12_8_1" - ], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142", - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8" - ], - "const_args": [ - "onnx::MatMul_5936_11_0_35" - ], - "out_args": [ - 
"/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "5120", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143", - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_59-/up_blocks.1/attentions.1/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64" - ], - "const_args": [ - "NhwcConv_59_weight_NHWC" - ], - "out_args": [ - "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59" - ], - "attrs": { - "auto_pad": { - 
"type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59", - "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/Concat_2", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65", - 
"NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/Concat_2.out19_6_bfp.out20_5" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1920" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_39", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/Concat_2.out19_6_bfp.out20_5" - ], - "const_args": [ - "GroupNorm_39_wts_6_0_30" - ], - "out_args": [ - "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1920" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1920" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "3840" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1920" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1920" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_60-/up_blocks.1/resnets.2/conv1/Conv", - 
"type": "SDConv_bfp", - "in_args": [ - "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39" - ], - "const_args": [ - "NhwcConv_60_weight_NHWC" - ], - "out_args": [ - "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1920" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1920" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61", - "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - 
"ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_40", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66" - ], - "const_args": [ - "GroupNorm_40_wts_6_0_31" - ], - "out_args": [ - "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_61-/up_blocks.1/resnets.2/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40" - ], - "const_args": [ - "NhwcConv_61_weight_NHWC" - ], - "out_args": [ - "NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - 
"1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_62-/up_blocks.1/resnets.2/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/Concat_2.out19_6_bfp.out20_5" - ], - "const_args": [ - "NhwcConv_62_weight_NHWC" - ], - "out_args": [ - "NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1920" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1920" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/resnets.2/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60", - 
"NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_41", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67" - ], - "const_args": [ - "GroupNorm_41_wts_6_2_9" - ], - "out_args": [ - "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_63-/up_blocks.1/attentions.2/proj_in/Conv", - "type": 
"SDConv_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41" - ], - "const_args": [ - "NhwcConv_63_weight_NHWC" - ], - "out_args": [ - "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63" - ], - "const_args": [ - "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight", - "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": 
"int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" - ], - "const_args": [ - "Attention_9_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" - ], - "const_args": [ - "Attention_9_qkv_weight_query" - ], - "out_args": [ - 
"/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" - ], - "const_args": [ - "Attention_9_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_9", - "type": 
"SDMHA_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_1_8" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "256" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_1_8" - ], - "const_args": [ - "onnx::MatMul_5953_11_0_36" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - 
"value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147", - "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68" - ], - "const_args": [ - "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight", - "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - 
"1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28" - ], - "const_args": [ - "onnx::MatMul_5954" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_27", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27" - ], - "const_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27.wts9_27" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - 
"output_shape": { - "type": "int", - "value": [ - "2", - "8", - "256", - "160" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_9", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "160", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_SDCastBf2Bfp_9_148", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19" - ], - "const_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.wts9_148" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", 
- "value": [ - "2", - "256", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148" - ], - "const_args": [ - "onnx::MatMul_5964_11_0_37" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148", - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - 
"in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69" - ], - "const_args": [ - "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight", - "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_9_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29" - ], - "const_args": [ - "onnx::MatMul_5965_11_0_38_12_9_0" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - 
] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_9_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29" - ], - "const_args": [ - "onnx::MatMul_5965_11_0_38_12_9_1" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "5120" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150", - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9" - ], - 
"attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9" - ], - "const_args": [ - "onnx::MatMul_5966_11_0_39" - ], - "out_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "256", - "5120" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "5120", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151", - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69" - ], - "const_args": [], - "out_args": [ - "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - 
"2", - "256", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "256", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_64-/up_blocks.1/attentions.2/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70" - ], - "const_args": [ - "NhwcConv_64_weight_NHWC" - ], - "out_args": [ - "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/attentions.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64", - "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67" - ], - "const_args": [], - "out_args": [ - 
"/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.1/upsamplers.0/Resize", - "type": "SDResize_bfp", - "in_args": [ - "/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71" - ], - "const_args": [ - "/up_blocks.1/upsamplers.0/Resize.weights3_1" - ], - "out_args": [ - "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "16", - "16", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_65-/up_blocks.1/upsamplers.0/conv/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1" - ], - "const_args": [ - "NhwcConv_65_weight_NHWC" - ], - "out_args": [ - "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": 
"int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/Concat", - "type": "SDConcat_bfp", - "in_args": [ - "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65", - "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/Concat.out19_7_bfp.out20_6" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1920" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_42", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/Concat.out19_7_bfp.out20_6" - ], - "const_args": [ - "GroupNorm_42_wts_6_0_32" - ], - "out_args": [ - "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": 
"int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1920" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1920" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "3840" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1920" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1920" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_66-/up_blocks.2/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42" - ], - "const_args": [ - "NhwcConv_66_weight_NHWC" - ], - "out_args": [ - "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1920" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "1920" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.0/Add", - 
"type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67", - "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_43", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72" - ], - "const_args": [ - "GroupNorm_43_wts_6_0_33" - ], - "out_args": [ - "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - 
"type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_67-/up_blocks.2/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43" - ], - "const_args": [ - "NhwcConv_67_weight_NHWC" - ], - "out_args": [ - "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_68-/up_blocks.2/resnets.0/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/Concat.out19_7_bfp.out20_6" - ], - "const_args": [ - "NhwcConv_68_weight_NHWC" - ], - "out_args": [ - "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": 
"int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1920" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "1920" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66", - "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_44", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73" - ], - "const_args": [ - "GroupNorm_44_wts_6_2_10" - ], - "out_args": [ - "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": 
{ - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_69-/up_blocks.2/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44" - ], - "const_args": [ - "NhwcConv_69_weight_NHWC" - ], - "out_args": [ - "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - 
"type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69" - ], - "const_args": [ - "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", - "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" - ], - "const_args": [ - "Attention_10_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": 
"int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" - ], - "const_args": [ - "Attention_10_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" - ], - "const_args": [ - "Attention_10_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - 
"type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_10", - "type": "SDMHA_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_1_9" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "1024" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_1_9" - ], - "const_args": [ - 
"onnx::MatMul_5984_11_0_40" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155", - "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74" - ], - "const_args": [ - "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", - 
"up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31" - ], - "const_args": [ - "onnx::MatMul_5985" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - 
"1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_30", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30" - ], - "const_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30.wts9_30" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_10", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - 
"name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_SDCastBf2Bfp_9_156", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21" - ], - "const_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.wts9_156" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156" - ], - "const_args": [ - "onnx::MatMul_5995_11_0_41" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156", - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75" - ], - "const_args": [ - "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", - "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": 
"str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_10_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32" - ], - "const_args": [ - "onnx::MatMul_5996_11_0_42_12_10_0" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_10_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32" - ], - "const_args": [ - "onnx::MatMul_5996_11_0_42_12_10_1" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158", - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10" - ], - "const_args": [ - "onnx::MatMul_5997_11_0_43" - ], - "out_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "2560", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - 
"value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159", - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_70-/up_blocks.2/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76" - ], - "const_args": [ - "NhwcConv_70_weight_NHWC" - ], - "out_args": [ - "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", 
- "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70", - "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/Concat_1", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77", - "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/Concat_1.out19_8_bfp.out20_7" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_45", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/Concat_1.out19_8_bfp.out20_7" - ], - "const_args": [ - "GroupNorm_45_wts_6_0_34" - ], - "out_args": [ - "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "2560" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_71-/up_blocks.2/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45" - ], - "const_args": [ - "NhwcConv_71_weight_NHWC" - ], - "out_args": [ - "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - 
"value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72", - "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_46", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78" - ], - "const_args": [ - "GroupNorm_46_wts_6_0_35" - ], - "out_args": [ - "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": 
"int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_72-/up_blocks.2/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46" - ], - "const_args": [ - "NhwcConv_72_weight_NHWC" - ], - "out_args": [ - "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_73-/up_blocks.2/resnets.1/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - 
"/up_blocks.2/Concat_1.out19_8_bfp.out20_7" - ], - "const_args": [ - "NhwcConv_73_weight_NHWC" - ], - "out_args": [ - "NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "1280" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71", - "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - 
}, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_47", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79" - ], - "const_args": [ - "GroupNorm_47_wts_6_2_11" - ], - "out_args": [ - "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_74-/up_blocks.2/attentions.1/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47" - ], - "const_args": [ - "NhwcConv_74_weight_NHWC" - ], - "out_args": [ - "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - 
"input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74" - ], - "const_args": [ - "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", - "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" - ], - 
"const_args": [ - "Attention_11_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" - ], - "const_args": [ - "Attention_11_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ 
- "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" - ], - "const_args": [ - "Attention_11_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_11", - "type": "SDMHA_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_1_10" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "1024" - ] - }, - "op_version": { - "type": 
"str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_1_10" - ], - "const_args": [ - "onnx::MatMul_6014_11_0_44" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163", - "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - 
"type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80" - ], - "const_args": [ - "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", - "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34" - ], - "const_args": [ - "onnx::MatMul_6015" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - 
"640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_33", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33" - ], - "const_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33.wts9_33" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_11", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23" - ], - "attrs": { - "num_heads": { - 
"type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_SDCastBf2Bfp_9_164", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23" - ], - "const_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.wts9_164" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164" - ], - "const_args": [ - "onnx::MatMul_6025_11_0_45" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - 
"type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164", - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81" - ], - "const_args": [ - "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", - "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, 
- "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_11_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35" - ], - "const_args": [ - "onnx::MatMul_6026_11_0_46_12_11_0" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_11_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35" - ], 
- "const_args": [ - "onnx::MatMul_6026_11_0_46_12_11_1" - ], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166", - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11" - ], - "const_args": [ - "onnx::MatMul_6027_11_0_47" - ], - "out_args": [ - 
"/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "2560", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167", - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_75-/up_blocks.2/attentions.1/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82" - ], - "const_args": [ - "NhwcConv_75_weight_NHWC" - ], - "out_args": [ - "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75" - ], - "attrs": { - "auto_pad": { 
- "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75", - "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/Concat_2", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83", - 
"NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/Concat_2.out19_9_bfp.out20_8" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "960" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_48", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/Concat_2.out19_9_bfp.out20_8" - ], - "const_args": [ - "GroupNorm_48_wts_6_0_36" - ], - "out_args": [ - "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "960" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "960" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1920" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "960" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "960" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_76-/up_blocks.2/resnets.2/conv1/Conv", - "type": 
"SDConv_bfp", - "in_args": [ - "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48" - ], - "const_args": [ - "NhwcConv_76_weight_NHWC" - ], - "out_args": [ - "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "960" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "960" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77", - "/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": 
{ - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_49", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84" - ], - "const_args": [ - "GroupNorm_49_wts_6_0_37" - ], - "out_args": [ - "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_77-/up_blocks.2/resnets.2/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49" - ], - "const_args": [ - "NhwcConv_77_weight_NHWC" - ], - "out_args": [ - "NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - 
"input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_78-/up_blocks.2/resnets.2/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/Concat_2.out19_9_bfp.out20_8" - ], - "const_args": [ - "NhwcConv_78_weight_NHWC" - ], - "out_args": [ - "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "960" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "960" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/resnets.2/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76", - 
"NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_50", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85" - ], - "const_args": [ - "GroupNorm_50_wts_6_2_12" - ], - "out_args": [ - "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_79-/up_blocks.2/attentions.2/proj_in/Conv", - "type": 
"SDConv_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50" - ], - "const_args": [ - "NhwcConv_79_weight_NHWC" - ], - "out_args": [ - "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79" - ], - "const_args": [ - "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight", - "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", 
- "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" - ], - "const_args": [ - "Attention_12_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" - ], - "const_args": [ - "Attention_12_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168" - 
], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" - ], - "const_args": [ - "Attention_12_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_12", - "type": "SDMHA_bfp", - "in_args": [ - 
"/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_1_11" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "1024" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_1_11" - ], - "const_args": [ - "onnx::MatMul_6044_11_0_48" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - 
}, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171", - "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86" - ], - "const_args": [ - "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight", - "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { 
- "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37" - ], - "const_args": [ - "onnx::MatMul_6045" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_36", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36" - ], - "const_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36.wts9_36" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "1024", - "80" - ] - }, - "output_shape": { - "type": "int", - "value": [ - 
"2", - "8", - "1024", - "80" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_12", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "80", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_SDCastBf2Bfp_9_172", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25" - ], - "const_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.wts9_172" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - 
"in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172" - ], - "const_args": [ - "onnx::MatMul_6055_11_0_49" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172", - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87" - ], - "const_args": [ - "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight", - "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_12_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38" - ], - "const_args": [ - "onnx::MatMul_6056_11_0_50_12_12_0" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - 
"value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_12_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38" - ], - "const_args": [ - "onnx::MatMul_6056_11_0_50_12_12_1" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "2560" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174", - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12" - ], - "attrs": { - "a_shape": { - "type": "int", 
- "value": [ - "2", - "1024", - "2560" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12" - ], - "const_args": [ - "onnx::MatMul_6057_11_0_51" - ], - "out_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "1024", - "2560" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "2560", - "640" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175", - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - 
"c_shape": { - "type": "int", - "value": [ - "2", - "1024", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_80-/up_blocks.2/attentions.2/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88" - ], - "const_args": [ - "NhwcConv_80_weight_NHWC" - ], - "out_args": [ - "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/attentions.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80", - "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85" - ], - "const_args": [], - "out_args": [ - "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89" - ], - 
"attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.2/upsamplers.0/Resize", - "type": "SDResize_bfp", - "in_args": [ - "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89" - ], - "const_args": [ - "/up_blocks.2/upsamplers.0/Resize.weights3_2" - ], - "out_args": [ - "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "32", - "32", - "640" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_81-/up_blocks.2/upsamplers.0/conv/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2" - ], - "const_args": [ - "NhwcConv_81_weight_NHWC" - ], - "out_args": [ - "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { 
- "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "640", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/Concat", - "type": "SDConcat_bfp", - "in_args": [ - "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81", - "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/Concat.out19_10_bfp.out20_9" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "960" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_51", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/Concat.out19_10_bfp.out20_9" - ], - "const_args": [ - "GroupNorm_51_wts_6_0_38" - ], - "out_args": [ - "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - 
"value": [ - "2", - "64", - "64", - "960" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "960" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1920" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "960" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "960" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_82-/up_blocks.3/resnets.0/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51" - ], - "const_args": [ - "NhwcConv_82_weight_NHWC" - ], - "out_args": [ - "NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "960" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "960" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - 
"NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83", - "/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_52", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90" - ], - "const_args": [ - "GroupNorm_52_wts_6_0_39" - ], - "out_args": [ - "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } 
- }, - { - "name": "NhwcConv_83-/up_blocks.3/resnets.0/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52" - ], - "const_args": [ - "NhwcConv_83_weight_NHWC" - ], - "out_args": [ - "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_84-/up_blocks.3/resnets.0/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/Concat.out19_10_bfp.out20_9" - ], - "const_args": [ - "NhwcConv_84_weight_NHWC" - ], - "out_args": [ - "NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - 
"input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "960" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "960" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82", - "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_53", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91" - ], - "const_args": [ - "GroupNorm_53_wts_6_2_13" - ], - "out_args": [ - "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - 
}, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_85-/up_blocks.3/attentions.0/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53" - ], - "const_args": [ - "NhwcConv_85_weight_NHWC" - ], - "out_args": [ - "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - 
"/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85" - ], - "const_args": [ - "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight", - "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" - ], - "const_args": [ - "Attention_13_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - 
"in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" - ], - "const_args": [ - "Attention_13_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" - ], - "const_args": [ - "Attention_13_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - 
"4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_13", - "type": "SDMHA_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_1_12" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "4096" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_1_12" - ], - "const_args": [ - "onnx::MatMul_6075_11_0_52" - ], - 
"out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179", - "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92" - ], - "const_args": [ - "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight", - 
"up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40" - ], - "const_args": [ - "onnx::MatMul_6076" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - 
"1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_39", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39" - ], - "const_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39.wts9_39" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_13", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - 
"name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_SDCastBf2Bfp_9_180", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27" - ], - "const_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.wts9_180" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180" - ], - "const_args": [ - "onnx::MatMul_6086_11_0_53" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - 
"/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180", - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93" - ], - "const_args": [ - "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight", - "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": 
"str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_13_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41" - ], - "const_args": [ - "onnx::MatMul_6087_11_0_54_12_13_0" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_13_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41" - ], - "const_args": [ - "onnx::MatMul_6087_11_0_54_12_13_1" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182", - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13" - ], - "const_args": [ - "onnx::MatMul_6088_11_0_55" - ], - "out_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - 
"value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183", - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_86-/up_blocks.3/attentions.0/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94" - ], - "const_args": [ - "NhwcConv_86_weight_NHWC" - ], - "out_args": [ - "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", 
- "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86", - "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/Concat_1", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95", - "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/Concat_1.out19_11_bfp.out20_10" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_54", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/Concat_1.out19_11_bfp.out20_10" - ], - "const_args": [ - "GroupNorm_54_wts_6_0_40" - ], - "out_args": [ - "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_87-/up_blocks.3/resnets.1/conv1/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54" - ], - "const_args": [ - "NhwcConv_87_weight_NHWC" - ], - "out_args": [ - "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": 
[ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88", - "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_55", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96" - ], - "const_args": [ - "GroupNorm_55_wts_6_0_41" - ], - "out_args": [ - "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - 
"value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_88-/up_blocks.3/resnets.1/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55" - ], - "const_args": [ - "NhwcConv_88_weight_NHWC" - ], - "out_args": [ - "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_89-/up_blocks.3/resnets.1/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - 
"/up_blocks.3/Concat_1.out19_11_bfp.out20_10" - ], - "const_args": [ - "NhwcConv_89_weight_NHWC" - ], - "out_args": [ - "NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.1/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87", - "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - 
}, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_56", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97" - ], - "const_args": [ - "GroupNorm_56_wts_6_2_14" - ], - "out_args": [ - "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_90-/up_blocks.3/attentions.1/proj_in/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56" - ], - "const_args": [ - "NhwcConv_90_weight_NHWC" - ], - "out_args": [ - "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - 
"input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90" - ], - "const_args": [ - "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight", - "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" - ], - 
"const_args": [ - "Attention_14_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" - ], - "const_args": [ - "Attention_14_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ 
- "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" - ], - "const_args": [ - "Attention_14_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_14", - "type": "SDMHA_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_1_13" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "4096" - ] - }, - "op_version": { - "type": 
"str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_1_13" - ], - "const_args": [ - "onnx::MatMul_6105_11_0_56" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187", - "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - 
"type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98" - ], - "const_args": [ - "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight", - "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43" - ], - "const_args": [ - "onnx::MatMul_6106" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - 
"320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_42", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42" - ], - "const_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42.wts9_42" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_14", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29" - ], - "attrs": { - "num_heads": { - 
"type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_SDCastBf2Bfp_9_188", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29" - ], - "const_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.wts9_188" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188" - ], - "const_args": [ - "onnx::MatMul_6116_11_0_57" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - 
"type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188", - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99" - ], - "const_args": [ - "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight", - "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, 
- "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_14_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44" - ], - "const_args": [ - "onnx::MatMul_6117_11_0_58_12_14_0" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_14_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44" - ], 
- "const_args": [ - "onnx::MatMul_6117_11_0_58_12_14_1" - ], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190", - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14" - ], - "const_args": [ - "onnx::MatMul_6118_11_0_59" - ], - "out_args": [ - 
"/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191", - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_91-/up_blocks.3/attentions.1/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100" - ], - "const_args": [ - "NhwcConv_91_weight_NHWC" - ], - "out_args": [ - "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91" - ], - "attrs": { - "auto_pad": 
{ - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.1/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91", - "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/Concat_2", - "type": "SDConcat_bfp", - "in_args": [ - "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101", - 
"NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/Concat_2.out19_12_bfp.out20_11" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "3" - ] - }, - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_57", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/Concat_2.out19_12_bfp.out20_11" - ], - "const_args": [ - "GroupNorm_57_wts_6_0_42" - ], - "out_args": [ - "GroupNorm_57.out7_57.out6_0_42_bfp.out7_57" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "1280" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_92-/up_blocks.3/resnets.2/conv1/Conv", - "type": "SDConv_bfp", - 
"in_args": [ - "GroupNorm_57.out7_57.out6_0_42_bfp.out7_57" - ], - "const_args": [ - "NhwcConv_92_weight_NHWC" - ], - "out_args": [ - "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93", - "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "1", - "1", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": 
"int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_58", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102" - ], - "const_args": [ - "GroupNorm_58_wts_6_0_43" - ], - "out_args": [ - "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_93-/up_blocks.3/resnets.2/conv2/Conv", - "type": "SDConv_bfp", - "in_args": [ - "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58" - ], - "const_args": [ - "NhwcConv_93_weight_NHWC" - ], - "out_args": [ - "NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": 
{ - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_94-/up_blocks.3/resnets.2/conv_shortcut/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/Concat_2.out19_12_bfp.out20_11" - ], - "const_args": [ - "NhwcConv_94_weight_NHWC" - ], - "out_args": [ - "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "640" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "640" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/resnets.2/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92", - 
"NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_59", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103" - ], - "const_args": [ - "GroupNorm_59_wts_6_2_15" - ], - "out_args": [ - "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999974752427e-07" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_95-/up_blocks.3/attentions.2/proj_in/Conv", - "type": 
"SDConv_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59" - ], - "const_args": [ - "NhwcConv_95_weight_NHWC" - ], - "out_args": [ - "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95" - ], - "const_args": [ - "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight", - "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", 
- "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" - ], - "const_args": [ - "Attention_15_qkv_weight_key" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" - ], - "const_args": [ - "Attention_15_qkv_weight_query" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192" - 
], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" - ], - "const_args": [ - "Attention_15_qkv_weight_value" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "3" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "Attention_15", - "type": "SDMHA_bfp", - "in_args": [ - 
"/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_1_14" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "4096" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v2" - ] - }, - "is_flash_mha": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_1_14" - ], - "const_args": [ - "onnx::MatMul_6135_11_0_60" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - 
}, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195", - "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104" - ], - "const_args": [ - "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight", - "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": 
{ - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46" - ], - "const_args": [ - "onnx::MatMul_6136" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "head_num": { - "type": "int", - "value": [ - "8" - ] - }, - "trans_head": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_SDCastBfp2Bf_9_45", - "type": "SDCastBfp2Bf", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45" - ], - "const_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45.wts9_45" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "8", - "4096", - "40" - ] - }, - "output_shape": { - "type": "int", - "value": [ 
- "2", - "8", - "4096", - "40" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "MultiHeadAttention_15", - "type": "SDFlatMHA", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31" - ], - "attrs": { - "num_heads": { - "type": "int", - "value": [ - "8" - ] - }, - "unidirectional": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "40", - "77" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfloat16", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "op_version": { - "type": "str", - "value": [ - "v1.1" - ] - }, - "is_flat_mha_1_1": { - "type": "int", - "value": [ - "1" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_SDCastBf2Bfp_9_196", - "type": "SDCastBf2Bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31" - ], - "const_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.wts9_196" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, 
- "in_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196" - ], - "const_args": [ - "onnx::MatMul_6146_11_0_61" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196", - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - 
"bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization", - "type": "SDLayerNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105" - ], - "const_args": [ - "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight", - "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47" - ], - "attrs": { - "axis": { - "type": "int", - "value": [ - "-1" - ] - }, - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "stash_type": { - "type": "int", - "value": [ - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_15_0", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47" - ], - "const_args": [ - "onnx::MatMul_6147_11_0_62_12_15_0" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", 
- "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Gelu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_15_1", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47" - ], - "const_args": [ - "onnx::MatMul_6147_11_0_62_12_15_1" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1280" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", - "type": "SDMul_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198", - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15" - ], - "attrs": { - "a_shape": { - "type": 
"int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", - "type": "SDGemm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15" - ], - "const_args": [ - "onnx::MatMul_6148_11_0_63" - ], - "out_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "4096", - "1280" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "1280", - "320" - ] - }, - "bias_enable": { - "type": "int", - "value": [ - "1" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add_2", - "type": "SDAdd_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199", - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106" - ], - "attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - 
}, - "c_shape": { - "type": "int", - "value": [ - "2", - "4096", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_96-/up_blocks.3/attentions.2/proj_out/Conv", - "type": "SDConv_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106" - ], - "const_args": [ - "NhwcConv_96_weight_NHWC" - ], - "out_args": [ - "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "pads": { - "type": "int", - "value": [ - "0", - "0", - "0", - "0" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "320", - "1", - "1", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "/up_blocks.3/attentions.2/Add", - "type": "SDAdd_bfp", - "in_args": [ - "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96", - "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103" - ], - "const_args": [], - "out_args": [ - "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107" - ], - 
"attrs": { - "a_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "b_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "c_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "is_bias_add": { - "type": "int", - "value": [ - "0" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_60", - "type": "SDGroupNorm_bfp", - "in_args": [ - "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107" - ], - "const_args": [ - "GroupNorm_60_wts_6_0_44" - ], - "out_args": [ - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60" - ], - "attrs": { - "epsilon": { - "type": "float", - "value": [ - "9.999999747378752e-06" - ] - }, - "groups": { - "type": "int", - "value": [ - "32" - ] - }, - "channels_last": { - "type": "int", - "value": [ - "1" - ] - }, - "activation": { - "type": "int", - "value": [ - "0" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "wts_shape": { - "type": "int", - "value": [ - "640" - ] - }, - "gamma_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "beta_shape": { - "type": "int", - "value": [ - "320" - ] - }, - "nonlinear": { - "type": "str", - "value": [ - "Silu" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8", - "bfloat16" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "GroupNorm_60_SDCastBfp2Bf_7_60", - "type": "SDCastBfp2Bf", - "in_args": [ - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60" - ], - "const_args": [ - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_bfp.wts7_60" - ], - 
"out_args": [ - "GroupNorm_60.out7_60.out6_0_44" - ], - "attrs": { - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfp16ebs8" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - }, - { - "name": "NhwcConv_97-/conv_out/Conv", - "type": "SDConv", - "in_args": [ - "GroupNorm_60.out7_60.out6_0_44" - ], - "const_args": [ - "NhwcConv_97_weight_NHWC" - ], - "out_args": [ - "NhwcConv_97_out-out_sample.out0_1_81" - ], - "attrs": { - "auto_pad": { - "type": "str", - "value": [ - "NOTSET" - ] - }, - "dilations": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "group": { - "type": "int", - "value": [ - "1" - ] - }, - "kernel_shape": { - "type": "int", - "value": [ - "3", - "3" - ] - }, - "pads": { - "type": "int", - "value": [ - "1", - "1", - "1", - "1" - ] - }, - "strides": { - "type": "int", - "value": [ - "1", - "1" - ] - }, - "input_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "320" - ] - }, - "output_shape": { - "type": "int", - "value": [ - "2", - "64", - "64", - "4" - ] - }, - "weight_shape": { - "type": "int", - "value": [ - "4", - "3", - "3", - "320" - ] - }, - "out_dtypes": { - "type": "str", - "value": [ - "bfloat16" - ] - }, - "in_dtypes": { - "type": "str", - "value": [ - "bfloat16", - "bfp16ebs8", - "float" - ] - }, - "ctrl_packet": { - "type": "int", - "value": [ - "1" - ] - } - } - } - ], - "fused_tensors": { - "in": { - "buffer_size": 7636224, - "xrt_arg_id": 0, - "packed_tensors": [ - "Transpose_44_out-sample.out0_1_0", - "encoder_hidden_states.out2_6_0", - "/time_proj/Concat_1_output_0.out2_3_0" - ] - }, - "out": { - "buffer_size": 65536, - "xrt_arg_id": 1, - "packed_tensors": [ - "NhwcConv_97_out-out_sample.out0_1_81" - ] - }, - "scratch": { - "buffer_size": 
1059969280, - "xrt_arg_id": 2, - "packed_tensors": [ - "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0", - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0", - "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13", - "/time_embedding/linear_1/Gemm_output_0.out2_3_0", - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0", - "/time_embedding/linear_2/Gemm_output_0.out2_3_1", - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1", - "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0", - "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1", - "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0", - "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1", - 
"NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2", - "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1", - "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2", - "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_1_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75", - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76", - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3", - "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2", - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77", - 
"/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78", - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79", - "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4", - "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4", - "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5", - "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3", - "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1", - "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5", - "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6", - "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4", - "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6", - "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7", - "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5", - "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_1_1", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83", - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4", - 
"/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84", - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9", - "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5", - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85", - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86", - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1", - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87", - "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10", - "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8", - "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11", - "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9", - "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6", - "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2", - "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11", - "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12", - "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7", - "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3", - "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4", - "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5", - "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6", - "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7", - 
"/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8", - "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9", - "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10", - "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11", - "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19", - "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13", - "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14", - "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25", - "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16", - "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17", - "/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28", - 
"/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31", - "/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19", - "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20", - "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21", - "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12", - "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10", - "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13", - "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8", - "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_1_2", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91", - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5", - 
"/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92", - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15", - "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8", - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93", - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94", - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2", - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95", - "/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16", - "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14", - "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17", - "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9", - "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15", - "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18", - "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10", - "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16", - "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19", - "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11", - "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96", - 
"/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_1_3", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99", - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100", - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21", - "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11", - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101", - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102", - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3", - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103", - "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22", - "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18", - "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23", - "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19", - "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12", - 
"NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21", - "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24", - "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13", - "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22", - "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20", - "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25", - "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14", - "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_1_4", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107", - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108", - 
"/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27", - "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14", - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109", - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110", - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4", - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111", - "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28", - "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24", - "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29", - "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15", - "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25", - "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30", - "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16", - "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26", - "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31", - "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17", - "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_1_5", - 
"/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115", - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116", - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33", - "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17", - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117", - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118", - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5", - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119", - "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34", - "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28", - "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35", - "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29", - "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18", - "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30", - "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36", - "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19", - 
"NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31", - "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37", - "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20", - "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32", - "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38", - "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21", - "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33", - "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39", - "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22", - "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34", - "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40", - "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23", - "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35", - "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41", - "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24", - "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20", - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12", - 
"/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123", - "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123", - "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42", - "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38", - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13", - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124", - "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43", - "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20", - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125", - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126", - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6", - "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127", - "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44", - "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37", - "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45", - "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25", - "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38", - "/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46", - "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26", - "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39", - 
"/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47", - "/up_blocks.0/Concat.out19_1_bfp.out20_0", - "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27", - "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41", - "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48", - "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28", - "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42", - "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40", - "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49", - "/up_blocks.0/Concat_1.out19_2_bfp.out20_1", - "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29", - "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44", - "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50", - "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30", - "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45", - "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43", - "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51", - "/up_blocks.0/Concat_2.out19_3_bfp.out20_2", - "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31", - "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47", - "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52", - "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32", - "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48", - "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46", - "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53", - "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0", - "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49", - "/up_blocks.1/Concat.out19_4_bfp.out20_3", - "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33", - "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51", - 
"/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54", - "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34", - "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52", - "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50", - "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55", - "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35", - "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_1_6", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131", - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56", - "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132", - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57", - 
"/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23", - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133", - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134", - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7", - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135", - "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58", - "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54", - "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59", - "/up_blocks.1/Concat_1.out19_5_bfp.out20_4", - "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36", - "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56", - "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60", - "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37", - "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57", - "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55", - "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61", - "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38", - "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_1_7", - 
"/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139", - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140", - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63", - "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26", - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141", - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142", - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8", - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143", - "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64", - "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59", - "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65", - "/up_blocks.1/Concat_2.out19_6_bfp.out20_5", - "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39", - "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61", - "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66", - "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40", - "NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62", - 
"NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60", - "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67", - "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41", - "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_1_8", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147", - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148", - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69", - "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29", - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149", - 
"/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150", - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9", - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151", - "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70", - "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64", - "/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71", - "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1", - "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65", - "/up_blocks.2/Concat.out19_7_bfp.out20_6", - "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42", - "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67", - "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72", - "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43", - "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68", - "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66", - "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73", - "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44", - "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_1_9", - 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155", - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156", - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75", - "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32", - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157", - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158", - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10", - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159", - "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76", - "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70", - "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77", - "/up_blocks.2/Concat_1.out19_8_bfp.out20_7", - "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45", - "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72", - "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78", - "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46", - "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73", - 
"NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71", - "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79", - "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47", - "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_1_10", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163", - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164", - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81", - "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35", - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165", - 
"/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166", - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11", - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167", - "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82", - "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75", - "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83", - "/up_blocks.2/Concat_2.out19_9_bfp.out20_8", - "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48", - "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77", - "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84", - "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49", - "NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78", - "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76", - "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85", - "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50", - "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_1_11", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171", - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86", - 
"/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172", - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87", - "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38", - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173", - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174", - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12", - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175", - "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88", - "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80", - "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89", - "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2", - "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81", - "/up_blocks.3/Concat.out19_10_bfp.out20_9", - "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51", - "NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83", - "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90", - "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52", - "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84", - 
"NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82", - "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91", - "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53", - "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_1_12", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179", - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180", - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93", - "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41", - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181", - 
"/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182", - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13", - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183", - "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94", - "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86", - "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95", - "/up_blocks.3/Concat_1.out19_11_bfp.out20_10", - "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54", - "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88", - "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96", - "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55", - "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89", - "NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87", - "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97", - "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56", - "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_1_13", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187", - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98", - 
"/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188", - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99", - "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44", - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189", - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190", - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14", - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191", - "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100", - "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91", - "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101", - "/up_blocks.3/Concat_2.out19_12_bfp.out20_11", - "GroupNorm_57.out7_57.out6_0_42_bfp.out7_57", - "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93", - "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102", - "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58", - "NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94", - "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92", - "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103", - 
"/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59", - "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_1_14", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195", - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196", - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105", - "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47", - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197", - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198", - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15", - 
"/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199", - "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106", - "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96", - "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107", - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60", - "GroupNorm_60.out7_60.out6_0_44" - ] - }, - "const": { - "buffer_size": 990629824, - "xrt_arg_id": 3, - "packed_tensors": [ - "NhwcConv_0_weight_NHWC", - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.wts7_0", - "GroupNorm_0_wts_6_0_0", - "onnx::MatMul_5660", - "onnx::MatMul_5661", - "onnx::MatMul_5690", - "onnx::MatMul_5691", - "onnx::MatMul_5720", - "onnx::MatMul_5721", - "onnx::MatMul_5750", - "onnx::MatMul_5751", - "onnx::MatMul_5780", - "onnx::MatMul_5781", - "onnx::MatMul_5810", - "onnx::MatMul_5811", - "onnx::MatMul_5848", - "onnx::MatMul_5849", - "time_embedding.linear_1.weight_11_1_0", - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid.weights14_0", - "time_embedding.linear_2.weight_11_1_1", - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid.weights14_1", - "down_blocks.0.resnets.0.time_emb_proj.weight_11_1_2", - "NhwcConv_1_weight_NHWC", - "GroupNorm_1_wts_6_0_1", - "NhwcConv_2_weight_NHWC", - "GroupNorm_2_wts_6_2_0", - "NhwcConv_3_weight_NHWC", - "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight", - "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_0_qkv_weight_key", - "Attention_0_qkv_weight_query", - "Attention_0_qkv_weight_value", - "onnx::MatMul_5658_11_0_0", - "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight", - "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5659", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0.wts9_0", - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.wts9_76", - 
"onnx::MatMul_5669_11_0_1", - "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight", - "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5670_11_0_2_12_0_0", - "onnx::MatMul_5670_11_0_2_12_0_1", - "onnx::MatMul_5671_11_0_3", - "NhwcConv_4_weight_NHWC", - "GroupNorm_3_wts_6_0_2", - "down_blocks.0.resnets.1.time_emb_proj.weight_11_1_3", - "NhwcConv_5_weight_NHWC", - "GroupNorm_4_wts_6_0_3", - "NhwcConv_6_weight_NHWC", - "GroupNorm_5_wts_6_2_1", - "NhwcConv_7_weight_NHWC", - "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight", - "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias", - "Attention_1_qkv_weight_key", - "Attention_1_qkv_weight_query", - "Attention_1_qkv_weight_value", - "onnx::MatMul_5688_11_0_4", - "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight", - "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5689", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3.wts9_3", - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.wts9_84", - "onnx::MatMul_5699_11_0_5", - "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight", - "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5700_11_0_6_12_1_0", - "onnx::MatMul_5700_11_0_6_12_1_1", - "onnx::MatMul_5701_11_0_7", - "NhwcConv_8_weight_NHWC", - "NhwcConv_9_weight_NHWC", - "GroupNorm_6_wts_6_0_4", - "down_blocks.1.resnets.0.time_emb_proj.weight_11_1_4", - "NhwcConv_10_weight_NHWC", - "GroupNorm_7_wts_6_0_5", - "down_blocks.1.resnets.1.time_emb_proj.weight_11_1_5", - "down_blocks.2.resnets.0.time_emb_proj.weight_11_1_6", - "down_blocks.2.resnets.1.time_emb_proj.weight_11_1_7", - "down_blocks.3.resnets.0.time_emb_proj.weight_11_1_8", - "down_blocks.3.resnets.1.time_emb_proj.weight_11_1_9", - "mid_block.resnets.0.time_emb_proj.weight_11_1_10", - "mid_block.resnets.1.time_emb_proj.weight_11_1_11", - 
"up_blocks.0.resnets.0.time_emb_proj.weight_11_1_12", - "up_blocks.0.resnets.1.time_emb_proj.weight_11_1_13", - "up_blocks.0.resnets.2.time_emb_proj.weight_11_1_14", - "onnx::MatMul_5895", - "onnx::MatMul_5896", - "onnx::MatMul_5925", - "onnx::MatMul_5926", - "onnx::MatMul_5955", - "onnx::MatMul_5956", - "up_blocks.1.resnets.0.time_emb_proj.weight_11_1_15", - "up_blocks.1.resnets.1.time_emb_proj.weight_11_1_16", - "up_blocks.1.resnets.2.time_emb_proj.weight_11_1_17", - "onnx::MatMul_5986", - "onnx::MatMul_5987", - "onnx::MatMul_6016", - "onnx::MatMul_6017", - "onnx::MatMul_6046", - "onnx::MatMul_6047", - "up_blocks.2.resnets.0.time_emb_proj.weight_11_1_18", - "up_blocks.2.resnets.1.time_emb_proj.weight_11_1_19", - "up_blocks.2.resnets.2.time_emb_proj.weight_11_1_20", - "onnx::MatMul_6077", - "onnx::MatMul_6078", - "onnx::MatMul_6107", - "onnx::MatMul_6108", - "onnx::MatMul_6137", - "onnx::MatMul_6138", - "up_blocks.3.resnets.0.time_emb_proj.weight_11_1_21", - "up_blocks.3.resnets.1.time_emb_proj.weight_11_1_22", - "up_blocks.3.resnets.2.time_emb_proj.weight_11_1_23", - "NhwcConv_11_weight_NHWC", - "NhwcConv_12_weight_NHWC", - "GroupNorm_8_wts_6_2_2", - "NhwcConv_13_weight_NHWC", - "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", - "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_2_qkv_weight_key", - "Attention_2_qkv_weight_query", - "Attention_2_qkv_weight_value", - "onnx::MatMul_5718_11_0_8", - "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", - "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5719", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6.wts9_6", - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.wts9_92", - "onnx::MatMul_5729_11_0_9", - "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", - "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias", - 
"onnx::MatMul_5730_11_0_10_12_2_0", - "onnx::MatMul_5730_11_0_10_12_2_1", - "onnx::MatMul_5731_11_0_11", - "NhwcConv_14_weight_NHWC", - "GroupNorm_9_wts_6_0_6", - "NhwcConv_15_weight_NHWC", - "GroupNorm_10_wts_6_0_7", - "NhwcConv_16_weight_NHWC", - "GroupNorm_11_wts_6_2_3", - "NhwcConv_17_weight_NHWC", - "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", - "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias", - "Attention_3_qkv_weight_key", - "Attention_3_qkv_weight_query", - "Attention_3_qkv_weight_value", - "onnx::MatMul_5748_11_0_12", - "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", - "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5749", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9.wts9_9", - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.wts9_100", - "onnx::MatMul_5759_11_0_13", - "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", - "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5760_11_0_14_12_3_0", - "onnx::MatMul_5760_11_0_14_12_3_1", - "onnx::MatMul_5761_11_0_15", - "NhwcConv_18_weight_NHWC", - "NhwcConv_19_weight_NHWC", - "GroupNorm_12_wts_6_0_8", - "NhwcConv_20_weight_NHWC", - "GroupNorm_13_wts_6_0_9", - "NhwcConv_21_weight_NHWC", - "NhwcConv_22_weight_NHWC", - "GroupNorm_14_wts_6_2_4", - "NhwcConv_23_weight_NHWC", - "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", - "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_4_qkv_weight_key", - "Attention_4_qkv_weight_query", - "Attention_4_qkv_weight_value", - "onnx::MatMul_5778_11_0_16", - "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", - "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5779", - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12.wts9_12", - 
"/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.wts9_108", - "onnx::MatMul_5789_11_0_17", - "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", - "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5790_11_0_18_12_4_0", - "onnx::MatMul_5790_11_0_18_12_4_1", - "onnx::MatMul_5791_11_0_19", - "NhwcConv_24_weight_NHWC", - "GroupNorm_15_wts_6_0_10", - "NhwcConv_25_weight_NHWC", - "GroupNorm_16_wts_6_0_11", - "NhwcConv_26_weight_NHWC", - "GroupNorm_17_wts_6_2_5", - "NhwcConv_27_weight_NHWC", - "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", - "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias", - "Attention_5_qkv_weight_key", - "Attention_5_qkv_weight_query", - "Attention_5_qkv_weight_value", - "onnx::MatMul_5808_11_0_20", - "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", - "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5809", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15.wts9_15", - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.wts9_116", - "onnx::MatMul_5819_11_0_21", - "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", - "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5820_11_0_22_12_5_0", - "onnx::MatMul_5820_11_0_22_12_5_1", - "onnx::MatMul_5821_11_0_23", - "NhwcConv_28_weight_NHWC", - "NhwcConv_29_weight_NHWC", - "GroupNorm_18_wts_6_0_12", - "NhwcConv_30_weight_NHWC", - "GroupNorm_19_wts_6_0_13", - "NhwcConv_31_weight_NHWC", - "GroupNorm_20_wts_6_0_14", - "NhwcConv_32_weight_NHWC", - "GroupNorm_21_wts_6_0_15", - "NhwcConv_33_weight_NHWC", - "GroupNorm_22_wts_6_0_16", - "NhwcConv_34_weight_NHWC", - "GroupNorm_23_wts_6_0_17", - "NhwcConv_35_weight_NHWC", - "GroupNorm_24_wts_6_2_6", - "NhwcConv_36_weight_NHWC", - "mid_block.attentions.0.transformer_blocks.0.norm1.weight", - 
"mid_block.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_6_qkv_weight_key", - "Attention_6_qkv_weight_query", - "Attention_6_qkv_weight_value", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121.wts9_121", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120.wts9_120", - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122.wts9_122", - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.wts9_123", - "onnx::MatMul_5846_11_0_24", - "mid_block.attentions.0.transformer_blocks.0.norm2.weight", - "mid_block.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5847", - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18.wts9_18", - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.wts9_124", - "onnx::MatMul_5857_11_0_25", - "mid_block.attentions.0.transformer_blocks.0.norm3.weight", - "mid_block.attentions.0.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5858_11_0_26_12_6_0", - "onnx::MatMul_5858_11_0_26_12_6_1", - "onnx::MatMul_5859_11_0_27", - "NhwcConv_37_weight_NHWC", - "GroupNorm_25_wts_6_0_18", - "NhwcConv_38_weight_NHWC", - "GroupNorm_26_wts_6_0_19", - "NhwcConv_39_weight_NHWC", - "GroupNorm_27_wts_6_0_20", - "NhwcConv_40_weight_NHWC", - "GroupNorm_28_wts_6_0_21", - "NhwcConv_41_weight_NHWC", - "NhwcConv_42_weight_NHWC", - "GroupNorm_29_wts_6_0_22", - "NhwcConv_43_weight_NHWC", - "GroupNorm_30_wts_6_0_23", - "NhwcConv_44_weight_NHWC", - "NhwcConv_45_weight_NHWC", - "GroupNorm_31_wts_6_0_24", - "NhwcConv_46_weight_NHWC", - "GroupNorm_32_wts_6_0_25", - "NhwcConv_47_weight_NHWC", - "NhwcConv_48_weight_NHWC", - "/up_blocks.0/upsamplers.0/Resize.weights3_0", - "NhwcConv_49_weight_NHWC", - "GroupNorm_33_wts_6_0_26", - "NhwcConv_50_weight_NHWC", - 
"GroupNorm_34_wts_6_0_27", - "NhwcConv_51_weight_NHWC", - "NhwcConv_52_weight_NHWC", - "GroupNorm_35_wts_6_2_7", - "NhwcConv_53_weight_NHWC", - "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", - "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_7_qkv_weight_key", - "Attention_7_qkv_weight_query", - "Attention_7_qkv_weight_value", - "onnx::MatMul_5893_11_0_28", - "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", - "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5894", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21.wts9_21", - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.wts9_132", - "onnx::MatMul_5904_11_0_29", - "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", - "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5905_11_0_30_12_7_0", - "onnx::MatMul_5905_11_0_30_12_7_1", - "onnx::MatMul_5906_11_0_31", - "NhwcConv_54_weight_NHWC", - "GroupNorm_36_wts_6_0_28", - "NhwcConv_55_weight_NHWC", - "GroupNorm_37_wts_6_0_29", - "NhwcConv_56_weight_NHWC", - "NhwcConv_57_weight_NHWC", - "GroupNorm_38_wts_6_2_8", - "NhwcConv_58_weight_NHWC", - "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", - "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias", - "Attention_8_qkv_weight_key", - "Attention_8_qkv_weight_query", - "Attention_8_qkv_weight_value", - "onnx::MatMul_5923_11_0_32", - "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", - "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5924", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24.wts9_24", - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.wts9_140", - "onnx::MatMul_5934_11_0_33", - "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", - 
"up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5935_11_0_34_12_8_0", - "onnx::MatMul_5935_11_0_34_12_8_1", - "onnx::MatMul_5936_11_0_35", - "NhwcConv_59_weight_NHWC", - "GroupNorm_39_wts_6_0_30", - "NhwcConv_60_weight_NHWC", - "GroupNorm_40_wts_6_0_31", - "NhwcConv_61_weight_NHWC", - "NhwcConv_62_weight_NHWC", - "GroupNorm_41_wts_6_2_9", - "NhwcConv_63_weight_NHWC", - "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight", - "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias", - "Attention_9_qkv_weight_key", - "Attention_9_qkv_weight_query", - "Attention_9_qkv_weight_value", - "onnx::MatMul_5953_11_0_36", - "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight", - "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5954", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27.wts9_27", - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.wts9_148", - "onnx::MatMul_5964_11_0_37", - "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight", - "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5965_11_0_38_12_9_0", - "onnx::MatMul_5965_11_0_38_12_9_1", - "onnx::MatMul_5966_11_0_39", - "NhwcConv_64_weight_NHWC", - "/up_blocks.1/upsamplers.0/Resize.weights3_1", - "NhwcConv_65_weight_NHWC", - "GroupNorm_42_wts_6_0_32", - "NhwcConv_66_weight_NHWC", - "GroupNorm_43_wts_6_0_33", - "NhwcConv_67_weight_NHWC", - "NhwcConv_68_weight_NHWC", - "GroupNorm_44_wts_6_2_10", - "NhwcConv_69_weight_NHWC", - "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", - "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_10_qkv_weight_key", - "Attention_10_qkv_weight_query", - "Attention_10_qkv_weight_value", - "onnx::MatMul_5984_11_0_40", - "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", - "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_5985", - 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30.wts9_30", - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.wts9_156", - "onnx::MatMul_5995_11_0_41", - "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", - "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias", - "onnx::MatMul_5996_11_0_42_12_10_0", - "onnx::MatMul_5996_11_0_42_12_10_1", - "onnx::MatMul_5997_11_0_43", - "NhwcConv_70_weight_NHWC", - "GroupNorm_45_wts_6_0_34", - "NhwcConv_71_weight_NHWC", - "GroupNorm_46_wts_6_0_35", - "NhwcConv_72_weight_NHWC", - "NhwcConv_73_weight_NHWC", - "GroupNorm_47_wts_6_2_11", - "NhwcConv_74_weight_NHWC", - "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", - "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias", - "Attention_11_qkv_weight_key", - "Attention_11_qkv_weight_query", - "Attention_11_qkv_weight_value", - "onnx::MatMul_6014_11_0_44", - "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", - "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias", - "onnx::MatMul_6015", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33.wts9_33", - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.wts9_164", - "onnx::MatMul_6025_11_0_45", - "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", - "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias", - "onnx::MatMul_6026_11_0_46_12_11_0", - "onnx::MatMul_6026_11_0_46_12_11_1", - "onnx::MatMul_6027_11_0_47", - "NhwcConv_75_weight_NHWC", - "GroupNorm_48_wts_6_0_36", - "NhwcConv_76_weight_NHWC", - "GroupNorm_49_wts_6_0_37", - "NhwcConv_77_weight_NHWC", - "NhwcConv_78_weight_NHWC", - "GroupNorm_50_wts_6_2_12", - "NhwcConv_79_weight_NHWC", - "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight", - "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias", - "Attention_12_qkv_weight_key", - 
"Attention_12_qkv_weight_query", - "Attention_12_qkv_weight_value", - "onnx::MatMul_6044_11_0_48", - "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight", - "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias", - "onnx::MatMul_6045", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36.wts9_36", - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.wts9_172", - "onnx::MatMul_6055_11_0_49", - "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight", - "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias", - "onnx::MatMul_6056_11_0_50_12_12_0", - "onnx::MatMul_6056_11_0_50_12_12_1", - "onnx::MatMul_6057_11_0_51", - "NhwcConv_80_weight_NHWC", - "/up_blocks.2/upsamplers.0/Resize.weights3_2", - "NhwcConv_81_weight_NHWC", - "GroupNorm_51_wts_6_0_38", - "NhwcConv_82_weight_NHWC", - "GroupNorm_52_wts_6_0_39", - "NhwcConv_83_weight_NHWC", - "NhwcConv_84_weight_NHWC", - "GroupNorm_53_wts_6_2_13", - "NhwcConv_85_weight_NHWC", - "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight", - "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias", - "Attention_13_qkv_weight_key", - "Attention_13_qkv_weight_query", - "Attention_13_qkv_weight_value", - "onnx::MatMul_6075_11_0_52", - "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight", - "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias", - "onnx::MatMul_6076", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39.wts9_39", - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.wts9_180", - "onnx::MatMul_6086_11_0_53", - "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight", - "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias", - "onnx::MatMul_6087_11_0_54_12_13_0", - "onnx::MatMul_6087_11_0_54_12_13_1", - "onnx::MatMul_6088_11_0_55", - "NhwcConv_86_weight_NHWC", - "GroupNorm_54_wts_6_0_40", - 
"NhwcConv_87_weight_NHWC", - "GroupNorm_55_wts_6_0_41", - "NhwcConv_88_weight_NHWC", - "NhwcConv_89_weight_NHWC", - "GroupNorm_56_wts_6_2_14", - "NhwcConv_90_weight_NHWC", - "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight", - "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias", - "Attention_14_qkv_weight_key", - "Attention_14_qkv_weight_query", - "Attention_14_qkv_weight_value", - "onnx::MatMul_6105_11_0_56", - "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight", - "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias", - "onnx::MatMul_6106", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42.wts9_42", - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.wts9_188", - "onnx::MatMul_6116_11_0_57", - "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight", - "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias", - "onnx::MatMul_6117_11_0_58_12_14_0", - "onnx::MatMul_6117_11_0_58_12_14_1", - "onnx::MatMul_6118_11_0_59", - "NhwcConv_91_weight_NHWC", - "GroupNorm_57_wts_6_0_42", - "NhwcConv_92_weight_NHWC", - "GroupNorm_58_wts_6_0_43", - "NhwcConv_93_weight_NHWC", - "NhwcConv_94_weight_NHWC", - "GroupNorm_59_wts_6_2_15", - "NhwcConv_95_weight_NHWC", - "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight", - "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias", - "Attention_15_qkv_weight_key", - "Attention_15_qkv_weight_query", - "Attention_15_qkv_weight_value", - "onnx::MatMul_6135_11_0_60", - "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight", - "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias", - "onnx::MatMul_6136", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45.wts9_45", - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.wts9_196", - "onnx::MatMul_6146_11_0_61", - 
"up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight", - "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias", - "onnx::MatMul_6147_11_0_62_12_15_0", - "onnx::MatMul_6147_11_0_62_12_15_1", - "onnx::MatMul_6148_11_0_63", - "NhwcConv_96_weight_NHWC", - "GroupNorm_60_wts_6_0_44", - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_bfp.wts7_60", - "NhwcConv_97_weight_NHWC" - ] - }, - "super_instr": { - "buffer_size": 0, - "xrt_arg_id": 4, - "packed_tensors": [] - } - }, - "tensor_map": { - "Transpose_44_out-sample.out0_1_0": { - "packed_buffer_label": "in", - "xrt_arg_id": 0, - "dtype": "bfloat16", - "shape": [ - 2, - 64, - 64, - 4 - ], - "size_in_bytes": 65536, - "op_tensor_size": 65536, - "offset": 0 - }, - "encoder_hidden_states.out2_6_0": { - "packed_buffer_label": "in", - "xrt_arg_id": 0, - "dtype": "bfloat16", - "shape": [ - 2, - 77, - 768 - ], - "size_in_bytes": 236544, - "op_tensor_size": 236544, - "offset": 7399680 - }, - "/time_proj/Concat_1_output_0.out2_3_0": { - "packed_buffer_label": "in", - "xrt_arg_id": 0, - "dtype": "bfloat16", - "shape": [ - 2, - 320 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 3377152 - }, - "NhwcConv_97_out-out_sample.out0_1_81": { - "packed_buffer_label": "out", - "xrt_arg_id": 1, - "dtype": "bfloat16", - "shape": [ - 2, - 64, - 64, - 4 - ], - "size_in_bytes": 65536, - "op_tensor_size": 65536, - "offset": 0 - }, - "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 0 - }, - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 5242880 - }, - "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0": { - "packed_buffer_label": "scratch", - 
"xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 7864320 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 10485760 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 10584320 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 10682880 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 10781440 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 10880000 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 11077120 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 11274240 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 11471360 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 11668480 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 12062720 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 12456960 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 12851200 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 13245440 - }, - 
"/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 13639680 - }, - "/time_embedding/linear_1/Gemm_output_0.out2_3_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 14033920 - }, - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 14039040 - }, - "/time_embedding/linear_2/Gemm_output_0.out2_3_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 14044160 - }, - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 14049280 - }, - "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 320 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 14054400 - }, - "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 14055680 - }, - "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], 
- "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 16677120 - }, - "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 19298560 - }, - "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 21920000 - }, - "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 24541440 - }, - "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 27162880 - }, - "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 29784320 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 32405760 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - 
"op_tensor_size": 2621440, - "offset": 35027200 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 37648640 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 40270080 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_1_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 42891520 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 45512960 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 48134400 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 50755840 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 53377280 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 55998720 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 61241600 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 66484480 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 69105920 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 71727360 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 74348800 - }, - 
"/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 76970240 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 87456000 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 97941760 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 108427520 - }, - "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 111048960 - }, - "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 113670400 - }, - "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - 
"offset": 116291840 - }, - "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 118913280 - }, - "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 320 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 121534720 - }, - "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 121536000 - }, - "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 124157440 - }, - "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 126778880 - }, - "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 129400320 - }, - "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 132021760 - }, - "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 
2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 134643200 - }, - "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 137264640 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 139886080 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 142507520 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 145128960 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 147750400 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_1_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 150371840 - }, - 
"/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 152993280 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 155614720 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 158236160 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 160857600 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 163479040 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 168721920 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - 
"size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 173964800 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 176586240 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 179207680 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 181829120 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 184450560 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 194936320 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 205422080 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 215907840 - }, - "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 218529280 - }, - "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 221150720 - }, - "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 223772160 - }, - "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 320 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 226393600 - }, - "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 320 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 227048960 - }, - "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 640 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 227704320 - }, - "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, 
- 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 227706880 - }, - "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 229017600 - }, - "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 230328320 - }, - "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 640 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 231639040 - }, - "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231641600 - }, - "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231646720 - }, - "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231651840 - }, - "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231656960 - }, - "/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8": { - "packed_buffer_label": "scratch", - 
"xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231662080 - }, - "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231667200 - }, - "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231672320 - }, - "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231677440 - }, - "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 231682560 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 231687680 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 232081920 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 
394240, - "op_tensor_size": 394240, - "offset": 232476160 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 232870400 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 233264640 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 160 - ], - "size_in_bytes": 394240, - "op_tensor_size": 394240, - "offset": 233658880 - }, - "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 234053120 - }, - "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 234058240 - }, - "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 1280 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 234063360 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 234068480 - }, - 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 234265600 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 234462720 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 234659840 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 234856960 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 80 - ], - "size_in_bytes": 197120, - "op_tensor_size": 197120, - "offset": 235054080 - }, - "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 640 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 235251200 - }, - "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 640 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 235253760 - }, - 
"/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 640 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 235256320 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 235258880 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 235357440 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 235456000 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 235554560 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 235653120 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 77, - 40 - ], - "size_in_bytes": 98560, - "op_tensor_size": 98560, - "offset": 235751680 - }, - 
"/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 320 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 235850240 - }, - "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 320 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 235851520 - }, - "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1, - 1, - 320 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 235852800 - }, - "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 235854080 - }, - "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 237164800 - }, - "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 238475520 - }, - "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 239786240 - }, - "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13": { - "packed_buffer_label": 
"scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 241096960 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 242407680 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 243718400 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 245029120 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 246339840 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_1_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 247650560 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - 
"op_tensor_size": 1310720, - "offset": 248961280 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 250272000 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 251582720 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 252893440 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 254204160 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 256825600 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 259447040 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - 
"dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 260757760 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 262068480 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 263379200 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 264689920 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 269932800 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 275175680 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 280418560 - }, - 
"/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 281729280 - }, - "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 283040000 - }, - "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 284350720 - }, - "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 285661440 - }, - "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 286972160 - }, - "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 288282880 - }, - "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 289593600 - }, - "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16": { - "packed_buffer_label": 
"scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 290904320 - }, - "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 292215040 - }, - "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 293525760 - }, - "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 294836480 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 296147200 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 297457920 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 298768640 - }, - 
"/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 300079360 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_1_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 301390080 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 302700800 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 304011520 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 305322240 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 306632960 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - 
"shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 307943680 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 310565120 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 313186560 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 314497280 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 315808000 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 317118720 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 318429440 - }, - 
"/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 323672320 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 328915200 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 334158080 - }, - "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 335468800 - }, - "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 336779520 - }, - "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 338090240 - }, - "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 640 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - 
"offset": 339400960 - }, - "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 640 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 339728640 - }, - "NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 340056320 - }, - "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 340711680 - }, - "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 341367040 - }, - "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 342022400 - }, - "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 342677760 - }, - "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 343333120 - }, - "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 343988480 - }, - "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 344643840 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 345299200 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 345954560 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 346609920 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 347265280 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_1_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 
655360, - "offset": 347920640 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 348576000 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 349231360 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 349886720 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 350542080 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 351197440 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 352508160 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - 
"shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 353818880 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 354474240 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 355129600 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 355784960 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 356440320 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 359061760 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 361683200 - }, - 
"/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 364304640 - }, - "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 364960000 - }, - "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 365615360 - }, - "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 366270720 - }, - "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 366926080 - }, - "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 367581440 - }, - "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 368236800 - }, - "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 368892160 - }, - "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 369547520 - }, - "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 370202880 - }, - "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 370858240 - }, - "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 371513600 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 372168960 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 372824320 - }, - 
"/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 373479680 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 374135040 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_1_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 374790400 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 375445760 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 376101120 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 376756480 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - 
"dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 377411840 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 378067200 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 379377920 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 380688640 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 381344000 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 381999360 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 382654720 - }, - 
"/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 383310080 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 385931520 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 388552960 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 391174400 - }, - "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 391829760 - }, - "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 392485120 - }, - "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - 
"offset": 393140480 - }, - "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 393795840 - }, - "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 393959680 - }, - "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 394123520 - }, - "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 394287360 - }, - "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 394451200 - }, - "NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 394615040 - }, - "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 394778880 - }, - "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20": { - "packed_buffer_label": "scratch", - 
"xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 394942720 - }, - "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 395106560 - }, - "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 395270400 - }, - "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 395434240 - }, - "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 395598080 - }, - "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 395761920 - }, - "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 395925760 - }, - "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 
163840, - "offset": 396089600 - }, - "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 396253440 - }, - "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 396417280 - }, - "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 396581120 - }, - "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 396744960 - }, - "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 396908800 - }, - "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 397072640 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 397236480 - }, - 
"/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 397400320 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 397564160 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 397728000 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 397891840 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 398219520 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 398547200 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12": { - "packed_buffer_label": "scratch", - 
"xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 398874880 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 399202560 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 399366400 - }, - "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 399530240 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 399694080 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 399857920 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 64, - 160 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 400021760 - }, - 
"/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 400349440 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 400677120 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 400840960 - }, - "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 401004800 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 401168640 - }, - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 5120 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 401332480 - }, - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 5120 - ], - "size_in_bytes": 655360, - 
"op_tensor_size": 655360, - "offset": 401987840 - }, - "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 5120 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 402643200 - }, - "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 403298560 - }, - "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 403462400 - }, - "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 403626240 - }, - "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 403790080 - }, - "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 403953920 - }, - "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 404117760 - }, - 
"/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 404281600 - }, - "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 404445440 - }, - "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 404609280 - }, - "/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 404773120 - }, - "/up_blocks.0/Concat.out19_1_bfp.out20_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 2560 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 404936960 - }, - "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 2560 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 405264640 - }, - "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 405592320 - }, - "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - 
"size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 405756160 - }, - "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 405920000 - }, - "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 406083840 - }, - "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 406247680 - }, - "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 406411520 - }, - "/up_blocks.0/Concat_1.out19_2_bfp.out20_1": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 2560 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 406575360 - }, - "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 2560 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 406903040 - }, - "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 407230720 - }, - "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50": { 
- "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 407394560 - }, - "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 407558400 - }, - "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 407722240 - }, - "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 407886080 - }, - "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 408049920 - }, - "/up_blocks.0/Concat_2.out19_3_bfp.out20_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 2560 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 408213760 - }, - "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 2560 - ], - "size_in_bytes": 327680, - "op_tensor_size": 327680, - "offset": 408541440 - }, - "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 
163840, - "op_tensor_size": 163840, - "offset": 408869120 - }, - "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 409032960 - }, - "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 409196800 - }, - "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 409360640 - }, - "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 409524480 - }, - "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 8, - 1280 - ], - "size_in_bytes": 163840, - "op_tensor_size": 163840, - "offset": 409688320 - }, - "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 409852160 - }, - "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 410507520 - }, - 
"/up_blocks.1/Concat.out19_4_bfp.out20_3": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 2560 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 411162880 - }, - "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 2560 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 412473600 - }, - "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 413784320 - }, - "/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 414439680 - }, - "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 415095040 - }, - "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 415750400 - }, - "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 416405760 - }, - "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": 
"uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 417061120 - }, - "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 417716480 - }, - "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 418371840 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 419027200 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 419682560 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 420337920 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 420993280 - }, - 
"/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_1_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 421648640 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 422304000 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 422959360 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 423614720 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 424270080 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 424925440 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 
1310720, - "op_tensor_size": 1310720, - "offset": 426236160 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 427546880 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 428202240 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 428857600 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 429512960 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 430168320 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 432789760 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - 
"dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 435411200 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 438032640 - }, - "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 438688000 - }, - "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 439343360 - }, - "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 439998720 - }, - "/up_blocks.1/Concat_1.out19_5_bfp.out20_4": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 2560 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 440654080 - }, - "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 2560 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 441964800 - }, - "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - 
"op_tensor_size": 655360, - "offset": 443275520 - }, - "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 443930880 - }, - "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 444586240 - }, - "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 445241600 - }, - "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 445896960 - }, - "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 446552320 - }, - "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 447207680 - }, - "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 447863040 - }, - 
"/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 448518400 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 449173760 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 449829120 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 450484480 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_1_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 451139840 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 451795200 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 
2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 452450560 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 453105920 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 453761280 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 454416640 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 455727360 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 457038080 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 457693440 - }, - 
"/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 458348800 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 459004160 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 459659520 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 462280960 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 464902400 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 467523840 - }, - "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - 
"op_tensor_size": 655360, - "offset": 468179200 - }, - "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 468834560 - }, - "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 469489920 - }, - "/up_blocks.1/Concat_2.out19_6_bfp.out20_5": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1920 - ], - "size_in_bytes": 983040, - "op_tensor_size": 983040, - "offset": 470145280 - }, - "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1920 - ], - "size_in_bytes": 983040, - "op_tensor_size": 983040, - "offset": 471128320 - }, - "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 472111360 - }, - "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 472766720 - }, - "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 473422080 - }, - "NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 474077440 - }, - "NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 474732800 - }, - "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 475388160 - }, - "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 476043520 - }, - "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 476698880 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 477354240 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 478009600 - }, - 
"/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 478664960 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 479320320 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_1_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 479975680 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 480631040 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 481286400 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 481941760 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", 
- "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 482597120 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 256, - 160 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 483252480 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 484563200 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 485873920 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 486529280 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 487184640 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 487840000 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 488495360 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 491116800 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 5120 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 493738240 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 256, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 496359680 - }, - "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 497015040 - }, - "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 497670400 - }, - "/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 16, - 16, - 1280 - ], - "size_in_bytes": 655360, - "op_tensor_size": 655360, - "offset": 498325760 - }, - "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 1280 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 498981120 - }, - "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 1280 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 501602560 - }, - "/up_blocks.2/Concat.out19_7_bfp.out20_6": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 1920 - ], - "size_in_bytes": 3932160, - "op_tensor_size": 3932160, - "offset": 504224000 - }, - "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 1920 - ], - "size_in_bytes": 3932160, - "op_tensor_size": 3932160, - "offset": 508156160 - }, - "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 512088320 - }, - "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 513399040 - }, - "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 514709760 - }, - "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - 
"size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 516020480 - }, - "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 517331200 - }, - "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 518641920 - }, - "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 519952640 - }, - "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 521263360 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 522574080 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 523884800 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": 
"uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 525195520 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 526506240 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_1_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 527816960 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 529127680 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 530438400 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 531749120 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 533059840 - }, - 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 534370560 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 536992000 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 539613440 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 540924160 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 542234880 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 543545600 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - 
"size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 544856320 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 550099200 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 555342080 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 560584960 - }, - "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 561895680 - }, - "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 563206400 - }, - "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 564517120 - }, - "/up_blocks.2/Concat_1.out19_8_bfp.out20_7": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 1280 - ], - "size_in_bytes": 2621440, 
- "op_tensor_size": 2621440, - "offset": 565827840 - }, - "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 1280 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 568449280 - }, - "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 571070720 - }, - "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 572381440 - }, - "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 573692160 - }, - "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 575002880 - }, - "NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 576313600 - }, - "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 577624320 - }, - 
"/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 578935040 - }, - "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 580245760 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 581556480 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 582867200 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 584177920 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 585488640 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_1_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - 
"shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 586799360 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 588110080 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 589420800 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 590731520 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 592042240 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 593352960 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 595974400 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164": { 
- "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 598595840 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 599906560 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 601217280 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 602528000 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 603838720 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 609081600 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 614324480 - }, - 
"/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 619567360 - }, - "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 620878080 - }, - "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 622188800 - }, - "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 623499520 - }, - "/up_blocks.2/Concat_2.out19_9_bfp.out20_8": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 960 - ], - "size_in_bytes": 1966080, - "op_tensor_size": 1966080, - "offset": 624810240 - }, - "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 960 - ], - "size_in_bytes": 1966080, - "op_tensor_size": 1966080, - "offset": 626776320 - }, - "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 628742400 - }, - "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84": { - "packed_buffer_label": 
"scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 630053120 - }, - "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 631363840 - }, - "NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 632674560 - }, - "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 633985280 - }, - "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 635296000 - }, - "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 636606720 - }, - "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 637917440 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": 
"uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 639228160 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 640538880 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 641849600 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 643160320 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_1_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 644471040 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 645781760 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 647092480 - }, - 
"/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 648403200 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 649713920 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 1024, - 80 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 651024640 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 653646080 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 656267520 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 657578240 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - 
"size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 658888960 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 660199680 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 661510400 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 666753280 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 2560 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 671996160 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 1024, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 677239040 - }, - "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 678549760 - }, - "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 
2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 679860480 - }, - "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 32, - 32, - 640 - ], - "size_in_bytes": 1310720, - "op_tensor_size": 1310720, - "offset": 681171200 - }, - "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 640 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 682481920 - }, - "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 640 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 687724800 - }, - "/up_blocks.3/Concat.out19_10_bfp.out20_9": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 960 - ], - "size_in_bytes": 7864320, - "op_tensor_size": 7864320, - "offset": 692967680 - }, - "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 960 - ], - "size_in_bytes": 7864320, - "op_tensor_size": 7864320, - "offset": 700832000 - }, - "NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 708696320 - }, - "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - 
"offset": 711317760 - }, - "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 713939200 - }, - "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 716560640 - }, - "NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 719182080 - }, - "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 721803520 - }, - "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 724424960 - }, - "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 727046400 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 729667840 - }, - 
"/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 732289280 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 734910720 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 737532160 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_1_12": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 740153600 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 742775040 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 745396480 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40": { - "packed_buffer_label": "scratch", - 
"xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 748017920 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 750639360 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 753260800 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 758503680 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 763746560 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 766368000 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 768989440 - }, - 
"/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 771610880 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 774232320 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 784718080 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 795203840 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 805689600 - }, - "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 808311040 - }, - "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - 
"size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 810932480 - }, - "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 813553920 - }, - "/up_blocks.3/Concat_1.out19_11_bfp.out20_10": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 640 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 816175360 - }, - "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 640 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 821418240 - }, - "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 826661120 - }, - "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 829282560 - }, - "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 831904000 - }, - "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 834525440 - }, - 
"NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 837146880 - }, - "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 839768320 - }, - "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 842389760 - }, - "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 845011200 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 847632640 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 850254080 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - 
"op_tensor_size": 2621440, - "offset": 852875520 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 855496960 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_1_13": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 858118400 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 860739840 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 863361280 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 865982720 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 868604160 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46": { - "packed_buffer_label": "scratch", 
- "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 871225600 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 876468480 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 881711360 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 884332800 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 886954240 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 889575680 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 892197120 - }, - 
"/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 902682880 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 913168640 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 923654400 - }, - "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 926275840 - }, - "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 928897280 - }, - "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 931518720 - }, - "/up_blocks.3/Concat_2.out19_12_bfp.out20_11": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 640 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 934140160 - }, - 
"GroupNorm_57.out7_57.out6_0_42_bfp.out7_57": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 640 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 939383040 - }, - "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 944625920 - }, - "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 947247360 - }, - "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 949868800 - }, - "NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 952490240 - }, - "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 955111680 - }, - "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 957733120 - }, - "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59": { - "packed_buffer_label": 
"scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 960354560 - }, - "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 962976000 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 965597440 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 968218880 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 970840320 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 973461760 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_1_14": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 
976083200 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 978704640 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 981326080 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 983947520 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 986568960 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 8, - 4096, - 40 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 989190400 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 994433280 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 
320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 999676160 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1002297600 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1004919040 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1007540480 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 1010161920 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 1020647680 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 1280 - ], - "size_in_bytes": 10485760, - "op_tensor_size": 10485760, - "offset": 1031133440 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199": { - 
"packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 4096, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1041619200 - }, - "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1044240640 - }, - "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1046862080 - }, - "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1049483520 - }, - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "uint8", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 2621440, - "op_tensor_size": 2621440, - "offset": 1052104960 - }, - "GroupNorm_60.out7_60.out6_0_44": { - "packed_buffer_label": "scratch", - "xrt_arg_id": 2, - "dtype": "bfloat16", - "shape": [ - 2, - 64, - 64, - 320 - ], - "size_in_bytes": 5242880, - "op_tensor_size": 5242880, - "offset": 1054726400 - }, - "NhwcConv_0_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 31040 - ], - "size_in_bytes": 31040, - "op_tensor_size": 31040, - "offset": 0, - "file_name": ".cache/NhwcConv_0-conv_inConv_0.const", - "file_size": 31040 - }, - "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.wts7_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - 
"op_tensor_size": 128, - "offset": 31040, - "file_name": ".cache/NhwcConv_0-conv_inConv_1.const", - "file_size": 128 - }, - "GroupNorm_0_wts_6_0_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 31168, - "file_name": ".cache/NhwcConv_0-conv_inConv_2.const", - "file_size": 1280 - }, - "onnx::MatMul_5660": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 32448, - "file_name": ".cache/NhwcConv_0-conv_inConv_3.const", - "file_size": 281600 - }, - "onnx::MatMul_5661": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 314048, - "file_name": ".cache/NhwcConv_0-conv_inConv_4.const", - "file_size": 281600 - }, - "onnx::MatMul_5690": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 595648, - "file_name": ".cache/NhwcConv_0-conv_inConv_5.const", - "file_size": 281600 - }, - "onnx::MatMul_5691": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 877248, - "file_name": ".cache/NhwcConv_0-conv_inConv_6.const", - "file_size": 281600 - }, - "onnx::MatMul_5720": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 1158848, - "file_name": ".cache/NhwcConv_0-conv_inConv_7.const", - "file_size": 563200 - }, - "onnx::MatMul_5721": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - 
"op_tensor_size": 563200, - "offset": 1722048, - "file_name": ".cache/NhwcConv_0-conv_inConv_8.const", - "file_size": 563200 - }, - "onnx::MatMul_5750": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 2285248, - "file_name": ".cache/NhwcConv_0-conv_inConv_9.const", - "file_size": 563200 - }, - "onnx::MatMul_5751": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 2848448, - "file_name": ".cache/NhwcConv_0-conv_inConv_10.const", - "file_size": 563200 - }, - "onnx::MatMul_5780": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 3411648, - "file_name": ".cache/NhwcConv_0-conv_inConv_11.const", - "file_size": 1121280 - }, - "onnx::MatMul_5781": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 4532928, - "file_name": ".cache/NhwcConv_0-conv_inConv_12.const", - "file_size": 1121280 - }, - "onnx::MatMul_5810": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 5654208, - "file_name": ".cache/NhwcConv_0-conv_inConv_13.const", - "file_size": 1121280 - }, - "onnx::MatMul_5811": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 6775488, - "file_name": ".cache/NhwcConv_0-conv_inConv_14.const", - "file_size": 1121280 - }, - "onnx::MatMul_5848": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 
1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 7896768, - "file_name": ".cache/NhwcConv_0-conv_inConv_15.const", - "file_size": 1121280 - }, - "onnx::MatMul_5849": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 9018048, - "file_name": ".cache/NhwcConv_0-conv_inConv_16.const", - "file_size": 1121280 - }, - "time_embedding.linear_1.weight_11_1_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 10139328, - "file_name": ".cache/NhwcConv_0-conv_inConv_17.const", - "file_size": 471040 - }, - "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid.weights14_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 128 - ], - "size_in_bytes": 256, - "op_tensor_size": 256, - "offset": 10610368, - "file_name": ".cache/NhwcConv_0-conv_inConv_18.const", - "file_size": 256 - }, - "time_embedding.linear_2.weight_11_1_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 10610624, - "file_name": ".cache/NhwcConv_0-conv_inConv_19.const", - "file_size": 1868800 - }, - "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid.weights14_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 128 - ], - "size_in_bytes": 256, - "op_tensor_size": 256, - "offset": 12479424, - "file_name": ".cache/NhwcConv_0-conv_inConv_20.const", - "file_size": 256 - }, - "down_blocks.0.resnets.0.time_emb_proj.weight_11_1_2": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 467200 - ], - "size_in_bytes": 467200, - "op_tensor_size": 467200, - "offset": 12479680, - "file_name": 
".cache/NhwcConv_0-conv_inConv_21.const", - "file_size": 467200 - }, - "NhwcConv_1_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 12946880, - "file_name": ".cache/NhwcConv_0-conv_inConv_22.const", - "file_size": 1077760 - }, - "GroupNorm_1_wts_6_0_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 14024640, - "file_name": ".cache/NhwcConv_0-conv_inConv_23.const", - "file_size": 1280 - }, - "NhwcConv_2_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 14025920, - "file_name": ".cache/NhwcConv_0-conv_inConv_24.const", - "file_size": 1077760 - }, - "GroupNorm_2_wts_6_2_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 15103680, - "file_name": ".cache/NhwcConv_0-conv_inConv_25.const", - "file_size": 1280 - }, - "NhwcConv_3_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 15104960, - "file_name": ".cache/NhwcConv_0-conv_inConv_26.const", - "file_size": 125440 - }, - "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 15230400, - "file_name": ".cache/NhwcConv_0-conv_inConv_27.const", - "file_size": 640 - }, - "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - 
"shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 15231040, - "file_name": ".cache/NhwcConv_0-conv_inConv_28.const", - "file_size": 640 - }, - "Attention_0_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 15231680, - "file_name": ".cache/NhwcConv_0-conv_inConv_29.const", - "file_size": 118400 - }, - "Attention_0_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 15350080, - "file_name": ".cache/NhwcConv_0-conv_inConv_30.const", - "file_size": 118400 - }, - "Attention_0_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 15468480, - "file_name": ".cache/NhwcConv_0-conv_inConv_31.const", - "file_size": 118400 - }, - "onnx::MatMul_5658_11_0_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 15586880, - "file_name": ".cache/NhwcConv_0-conv_inConv_32.const", - "file_size": 117760 - }, - "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 15704640, - "file_name": ".cache/NhwcConv_0-conv_inConv_33.const", - "file_size": 640 - }, - "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 15705280, - "file_name": ".cache/NhwcConv_0-conv_inConv_34.const", - 
"file_size": 640 - }, - "onnx::MatMul_5659": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 15705920, - "file_name": ".cache/NhwcConv_0-conv_inConv_35.const", - "file_size": 118400 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0.wts9_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 15824320, - "file_name": ".cache/NhwcConv_0-conv_inConv_36.const", - "file_size": 128 - }, - "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.wts9_76": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 15824448, - "file_name": ".cache/NhwcConv_0-conv_inConv_37.const", - "file_size": 128 - }, - "onnx::MatMul_5669_11_0_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 15824576, - "file_name": ".cache/NhwcConv_0-conv_inConv_38.const", - "file_size": 117760 - }, - "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 15942336, - "file_name": ".cache/NhwcConv_0-conv_inConv_39.const", - "file_size": 640 - }, - "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 15942976, - "file_name": ".cache/NhwcConv_0-conv_inConv_40.const", - "file_size": 640 - }, - "onnx::MatMul_5670_11_0_2_12_0_0": 
{ - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 15943616, - "file_name": ".cache/NhwcConv_0-conv_inConv_41.const", - "file_size": 471040 - }, - "onnx::MatMul_5670_11_0_2_12_0_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 16414656, - "file_name": ".cache/NhwcConv_0-conv_inConv_42.const", - "file_size": 471040 - }, - "onnx::MatMul_5671_11_0_3": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 16885696, - "file_name": ".cache/NhwcConv_0-conv_inConv_43.const", - "file_size": 471040 - }, - "NhwcConv_4_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 17356736, - "file_name": ".cache/NhwcConv_0-conv_inConv_44.const", - "file_size": 125440 - }, - "GroupNorm_3_wts_6_0_2": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 17482176, - "file_name": ".cache/NhwcConv_0-conv_inConv_45.const", - "file_size": 1280 - }, - "down_blocks.0.resnets.1.time_emb_proj.weight_11_1_3": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 467200 - ], - "size_in_bytes": 467200, - "op_tensor_size": 467200, - "offset": 17483456, - "file_name": ".cache/NhwcConv_0-conv_inConv_46.const", - "file_size": 467200 - }, - "NhwcConv_5_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 17950656, - "file_name": 
".cache/NhwcConv_0-conv_inConv_47.const", - "file_size": 1077760 - }, - "GroupNorm_4_wts_6_0_3": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 19028416, - "file_name": ".cache/NhwcConv_0-conv_inConv_48.const", - "file_size": 1280 - }, - "NhwcConv_6_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 19029696, - "file_name": ".cache/NhwcConv_0-conv_inConv_49.const", - "file_size": 1077760 - }, - "GroupNorm_5_wts_6_2_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 20107456, - "file_name": ".cache/NhwcConv_0-conv_inConv_50.const", - "file_size": 1280 - }, - "NhwcConv_7_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 20108736, - "file_name": ".cache/NhwcConv_0-conv_inConv_51.const", - "file_size": 125440 - }, - "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 20234176, - "file_name": ".cache/NhwcConv_0-conv_inConv_52.const", - "file_size": 640 - }, - "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 20234816, - "file_name": ".cache/NhwcConv_0-conv_inConv_53.const", - "file_size": 640 - }, - "Attention_1_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 
118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 20235456, - "file_name": ".cache/NhwcConv_0-conv_inConv_54.const", - "file_size": 118400 - }, - "Attention_1_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 20353856, - "file_name": ".cache/NhwcConv_0-conv_inConv_55.const", - "file_size": 118400 - }, - "Attention_1_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 20472256, - "file_name": ".cache/NhwcConv_0-conv_inConv_56.const", - "file_size": 118400 - }, - "onnx::MatMul_5688_11_0_4": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 20590656, - "file_name": ".cache/NhwcConv_0-conv_inConv_57.const", - "file_size": 117760 - }, - "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 20708416, - "file_name": ".cache/NhwcConv_0-conv_inConv_58.const", - "file_size": 640 - }, - "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 20709056, - "file_name": ".cache/NhwcConv_0-conv_inConv_59.const", - "file_size": 640 - }, - "onnx::MatMul_5689": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 20709696, - "file_name": ".cache/NhwcConv_0-conv_inConv_60.const", - "file_size": 118400 - }, 
- "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3.wts9_3": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 20828096, - "file_name": ".cache/NhwcConv_0-conv_inConv_61.const", - "file_size": 128 - }, - "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.wts9_84": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 20828224, - "file_name": ".cache/NhwcConv_0-conv_inConv_62.const", - "file_size": 128 - }, - "onnx::MatMul_5699_11_0_5": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 20828352, - "file_name": ".cache/NhwcConv_0-conv_inConv_63.const", - "file_size": 117760 - }, - "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 20946112, - "file_name": ".cache/NhwcConv_0-conv_inConv_64.const", - "file_size": 640 - }, - "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 20946752, - "file_name": ".cache/NhwcConv_0-conv_inConv_65.const", - "file_size": 640 - }, - "onnx::MatMul_5700_11_0_6_12_1_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 20947392, - "file_name": ".cache/NhwcConv_0-conv_inConv_66.const", - "file_size": 471040 - }, - "onnx::MatMul_5700_11_0_6_12_1_1": { - 
"packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 21418432, - "file_name": ".cache/NhwcConv_0-conv_inConv_67.const", - "file_size": 471040 - }, - "onnx::MatMul_5701_11_0_7": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 21889472, - "file_name": ".cache/NhwcConv_0-conv_inConv_68.const", - "file_size": 471040 - }, - "NhwcConv_8_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 22360512, - "file_name": ".cache/NhwcConv_0-conv_inConv_69.const", - "file_size": 125440 - }, - "NhwcConv_9_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1062400 - ], - "size_in_bytes": 1062400, - "op_tensor_size": 1062400, - "offset": 22485952, - "file_name": ".cache/NhwcConv_0-conv_inConv_70.const", - "file_size": 1062400 - }, - "GroupNorm_6_wts_6_0_4": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 23548352, - "file_name": ".cache/NhwcConv_0-conv_inConv_71.const", - "file_size": 1280 - }, - "down_blocks.1.resnets.0.time_emb_proj.weight_11_1_4": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 934400 - ], - "size_in_bytes": 934400, - "op_tensor_size": 934400, - "offset": 23549632, - "file_name": ".cache/NhwcConv_0-conv_inConv_72.const", - "file_size": 934400 - }, - "NhwcConv_10_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2155520 - ], - "size_in_bytes": 2155520, - "op_tensor_size": 2155520, - "offset": 24484032, - "file_name": 
".cache/NhwcConv_0-conv_inConv_73.const", - "file_size": 2155520 - }, - "GroupNorm_7_wts_6_0_5": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 26639552, - "file_name": ".cache/NhwcConv_0-conv_inConv_74.const", - "file_size": 2560 - }, - "down_blocks.1.resnets.1.time_emb_proj.weight_11_1_5": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 934400 - ], - "size_in_bytes": 934400, - "op_tensor_size": 934400, - "offset": 26642112, - "file_name": ".cache/NhwcConv_0-conv_inConv_75.const", - "file_size": 934400 - }, - "down_blocks.2.resnets.0.time_emb_proj.weight_11_1_6": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 27576512, - "file_name": ".cache/NhwcConv_0-conv_inConv_76.const", - "file_size": 1868800 - }, - "down_blocks.2.resnets.1.time_emb_proj.weight_11_1_7": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 29445312, - "file_name": ".cache/NhwcConv_0-conv_inConv_77.const", - "file_size": 1868800 - }, - "down_blocks.3.resnets.0.time_emb_proj.weight_11_1_8": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 31314112, - "file_name": ".cache/NhwcConv_0-conv_inConv_78.const", - "file_size": 1868800 - }, - "down_blocks.3.resnets.1.time_emb_proj.weight_11_1_9": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 33182912, - "file_name": ".cache/NhwcConv_0-conv_inConv_79.const", - "file_size": 1868800 - }, - 
"mid_block.resnets.0.time_emb_proj.weight_11_1_10": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 35051712, - "file_name": ".cache/NhwcConv_0-conv_inConv_80.const", - "file_size": 1868800 - }, - "mid_block.resnets.1.time_emb_proj.weight_11_1_11": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 36920512, - "file_name": ".cache/NhwcConv_0-conv_inConv_81.const", - "file_size": 1868800 - }, - "up_blocks.0.resnets.0.time_emb_proj.weight_11_1_12": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 38789312, - "file_name": ".cache/NhwcConv_0-conv_inConv_82.const", - "file_size": 1868800 - }, - "up_blocks.0.resnets.1.time_emb_proj.weight_11_1_13": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 40658112, - "file_name": ".cache/NhwcConv_0-conv_inConv_83.const", - "file_size": 1868800 - }, - "up_blocks.0.resnets.2.time_emb_proj.weight_11_1_14": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 42526912, - "file_name": ".cache/NhwcConv_0-conv_inConv_84.const", - "file_size": 1868800 - }, - "onnx::MatMul_5895": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 44395712, - "file_name": ".cache/NhwcConv_0-conv_inConv_85.const", - "file_size": 1121280 - }, - "onnx::MatMul_5896": { - "packed_buffer_label": "const", - "xrt_arg_id": 
3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 45516992, - "file_name": ".cache/NhwcConv_0-conv_inConv_86.const", - "file_size": 1121280 - }, - "onnx::MatMul_5925": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 46638272, - "file_name": ".cache/NhwcConv_0-conv_inConv_87.const", - "file_size": 1121280 - }, - "onnx::MatMul_5926": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 47759552, - "file_name": ".cache/NhwcConv_0-conv_inConv_88.const", - "file_size": 1121280 - }, - "onnx::MatMul_5955": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 48880832, - "file_name": ".cache/NhwcConv_0-conv_inConv_89.const", - "file_size": 1121280 - }, - "onnx::MatMul_5956": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1121280 - ], - "size_in_bytes": 1121280, - "op_tensor_size": 1121280, - "offset": 50002112, - "file_name": ".cache/NhwcConv_0-conv_inConv_90.const", - "file_size": 1121280 - }, - "up_blocks.1.resnets.0.time_emb_proj.weight_11_1_15": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 51123392, - "file_name": ".cache/NhwcConv_0-conv_inConv_91.const", - "file_size": 1868800 - }, - "up_blocks.1.resnets.1.time_emb_proj.weight_11_1_16": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 52992192, - "file_name": 
".cache/NhwcConv_0-conv_inConv_92.const", - "file_size": 1868800 - }, - "up_blocks.1.resnets.2.time_emb_proj.weight_11_1_17": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 54860992, - "file_name": ".cache/NhwcConv_0-conv_inConv_93.const", - "file_size": 1868800 - }, - "onnx::MatMul_5986": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 56729792, - "file_name": ".cache/NhwcConv_0-conv_inConv_94.const", - "file_size": 563200 - }, - "onnx::MatMul_5987": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 57292992, - "file_name": ".cache/NhwcConv_0-conv_inConv_95.const", - "file_size": 563200 - }, - "onnx::MatMul_6016": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 57856192, - "file_name": ".cache/NhwcConv_0-conv_inConv_96.const", - "file_size": 563200 - }, - "onnx::MatMul_6017": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 58419392, - "file_name": ".cache/NhwcConv_0-conv_inConv_97.const", - "file_size": 563200 - }, - "onnx::MatMul_6046": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 563200, - "op_tensor_size": 563200, - "offset": 58982592, - "file_name": ".cache/NhwcConv_0-conv_inConv_98.const", - "file_size": 563200 - }, - "onnx::MatMul_6047": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 563200 - ], - "size_in_bytes": 
563200, - "op_tensor_size": 563200, - "offset": 59545792, - "file_name": ".cache/NhwcConv_0-conv_inConv_99.const", - "file_size": 563200 - }, - "up_blocks.2.resnets.0.time_emb_proj.weight_11_1_18": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 934400 - ], - "size_in_bytes": 934400, - "op_tensor_size": 934400, - "offset": 60108992, - "file_name": ".cache/NhwcConv_0-conv_inConv_100.const", - "file_size": 934400 - }, - "up_blocks.2.resnets.1.time_emb_proj.weight_11_1_19": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 934400 - ], - "size_in_bytes": 934400, - "op_tensor_size": 934400, - "offset": 61043392, - "file_name": ".cache/NhwcConv_0-conv_inConv_101.const", - "file_size": 934400 - }, - "up_blocks.2.resnets.2.time_emb_proj.weight_11_1_20": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 934400 - ], - "size_in_bytes": 934400, - "op_tensor_size": 934400, - "offset": 61977792, - "file_name": ".cache/NhwcConv_0-conv_inConv_102.const", - "file_size": 934400 - }, - "onnx::MatMul_6077": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 62912192, - "file_name": ".cache/NhwcConv_0-conv_inConv_103.const", - "file_size": 281600 - }, - "onnx::MatMul_6078": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 63193792, - "file_name": ".cache/NhwcConv_0-conv_inConv_104.const", - "file_size": 281600 - }, - "onnx::MatMul_6107": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 63475392, - "file_name": ".cache/NhwcConv_0-conv_inConv_105.const", - "file_size": 281600 - }, - 
"onnx::MatMul_6108": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 63756992, - "file_name": ".cache/NhwcConv_0-conv_inConv_106.const", - "file_size": 281600 - }, - "onnx::MatMul_6137": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 64038592, - "file_name": ".cache/NhwcConv_0-conv_inConv_107.const", - "file_size": 281600 - }, - "onnx::MatMul_6138": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 281600 - ], - "size_in_bytes": 281600, - "op_tensor_size": 281600, - "offset": 64320192, - "file_name": ".cache/NhwcConv_0-conv_inConv_108.const", - "file_size": 281600 - }, - "up_blocks.3.resnets.0.time_emb_proj.weight_11_1_21": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 467200 - ], - "size_in_bytes": 467200, - "op_tensor_size": 467200, - "offset": 64601792, - "file_name": ".cache/NhwcConv_0-conv_inConv_109.const", - "file_size": 467200 - }, - "up_blocks.3.resnets.1.time_emb_proj.weight_11_1_22": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 467200 - ], - "size_in_bytes": 467200, - "op_tensor_size": 467200, - "offset": 65068992, - "file_name": ".cache/NhwcConv_0-conv_inConv_110.const", - "file_size": 467200 - }, - "up_blocks.3.resnets.2.time_emb_proj.weight_11_1_23": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 467200 - ], - "size_in_bytes": 467200, - "op_tensor_size": 467200, - "offset": 65536192, - "file_name": ".cache/NhwcConv_0-conv_inConv_111.const", - "file_size": 467200 - }, - "NhwcConv_11_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - "size_in_bytes": 
4311040, - "op_tensor_size": 4311040, - "offset": 66003392, - "file_name": ".cache/NhwcConv_0-conv_inConv_112.const", - "file_size": 4311040 - }, - "NhwcConv_12_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 250880 - ], - "size_in_bytes": 250880, - "op_tensor_size": 250880, - "offset": 70314432, - "file_name": ".cache/NhwcConv_0-conv_inConv_113.const", - "file_size": 250880 - }, - "GroupNorm_8_wts_6_2_2": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 70565312, - "file_name": ".cache/NhwcConv_0-conv_inConv_114.const", - "file_size": 2560 - }, - "NhwcConv_13_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 70567872, - "file_name": ".cache/NhwcConv_0-conv_inConv_115.const", - "file_size": 501760 - }, - "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 71069632, - "file_name": ".cache/NhwcConv_0-conv_inConv_116.const", - "file_size": 1280 - }, - "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 71070912, - "file_name": ".cache/NhwcConv_0-conv_inConv_117.const", - "file_size": 1280 - }, - "Attention_2_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 71072192, - "file_name": ".cache/NhwcConv_0-conv_inConv_118.const", - "file_size": 471040 - }, - 
"Attention_2_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 71543232, - "file_name": ".cache/NhwcConv_0-conv_inConv_119.const", - "file_size": 471040 - }, - "Attention_2_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 72014272, - "file_name": ".cache/NhwcConv_0-conv_inConv_120.const", - "file_size": 471040 - }, - "onnx::MatMul_5718_11_0_8": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 72485312, - "file_name": ".cache/NhwcConv_0-conv_inConv_121.const", - "file_size": 473600 - }, - "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 72958912, - "file_name": ".cache/NhwcConv_0-conv_inConv_122.const", - "file_size": 1280 - }, - "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 72960192, - "file_name": ".cache/NhwcConv_0-conv_inConv_123.const", - "file_size": 1280 - }, - "onnx::MatMul_5719": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 72961472, - "file_name": ".cache/NhwcConv_0-conv_inConv_124.const", - "file_size": 471040 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6.wts9_6": { - "packed_buffer_label": "const", - "xrt_arg_id": 
3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 73432512, - "file_name": ".cache/NhwcConv_0-conv_inConv_125.const", - "file_size": 128 - }, - "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.wts9_92": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 73432640, - "file_name": ".cache/NhwcConv_0-conv_inConv_126.const", - "file_size": 128 - }, - "onnx::MatMul_5729_11_0_9": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 73432768, - "file_name": ".cache/NhwcConv_0-conv_inConv_127.const", - "file_size": 473600 - }, - "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 73906368, - "file_name": ".cache/NhwcConv_0-conv_inConv_128.const", - "file_size": 1280 - }, - "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 73907648, - "file_name": ".cache/NhwcConv_0-conv_inConv_129.const", - "file_size": 1280 - }, - "onnx::MatMul_5730_11_0_10_12_2_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 73908928, - "file_name": ".cache/NhwcConv_0-conv_inConv_130.const", - "file_size": 1868800 - }, - "onnx::MatMul_5730_11_0_10_12_2_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - 
"op_tensor_size": 1868800, - "offset": 75777728, - "file_name": ".cache/NhwcConv_0-conv_inConv_131.const", - "file_size": 1868800 - }, - "onnx::MatMul_5731_11_0_11": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1884160 - ], - "size_in_bytes": 1884160, - "op_tensor_size": 1884160, - "offset": 77646528, - "file_name": ".cache/NhwcConv_0-conv_inConv_132.const", - "file_size": 1884160 - }, - "NhwcConv_14_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 79530688, - "file_name": ".cache/NhwcConv_0-conv_inConv_133.const", - "file_size": 501760 - }, - "GroupNorm_9_wts_6_0_6": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 80032448, - "file_name": ".cache/NhwcConv_0-conv_inConv_134.const", - "file_size": 2560 - }, - "NhwcConv_15_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - "size_in_bytes": 4311040, - "op_tensor_size": 4311040, - "offset": 80035008, - "file_name": ".cache/NhwcConv_0-conv_inConv_135.const", - "file_size": 4311040 - }, - "GroupNorm_10_wts_6_0_7": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 84346048, - "file_name": ".cache/NhwcConv_0-conv_inConv_136.const", - "file_size": 2560 - }, - "NhwcConv_16_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - "size_in_bytes": 4311040, - "op_tensor_size": 4311040, - "offset": 84348608, - "file_name": ".cache/NhwcConv_0-conv_inConv_137.const", - "file_size": 4311040 - }, - "GroupNorm_11_wts_6_2_3": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - 
"dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 88659648, - "file_name": ".cache/NhwcConv_0-conv_inConv_138.const", - "file_size": 2560 - }, - "NhwcConv_17_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 88662208, - "file_name": ".cache/NhwcConv_0-conv_inConv_139.const", - "file_size": 501760 - }, - "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 89163968, - "file_name": ".cache/NhwcConv_0-conv_inConv_140.const", - "file_size": 1280 - }, - "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 89165248, - "file_name": ".cache/NhwcConv_0-conv_inConv_141.const", - "file_size": 1280 - }, - "Attention_3_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 89166528, - "file_name": ".cache/NhwcConv_0-conv_inConv_142.const", - "file_size": 471040 - }, - "Attention_3_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 89637568, - "file_name": ".cache/NhwcConv_0-conv_inConv_143.const", - "file_size": 471040 - }, - "Attention_3_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 90108608, - "file_name": 
".cache/NhwcConv_0-conv_inConv_144.const", - "file_size": 471040 - }, - "onnx::MatMul_5748_11_0_12": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 90579648, - "file_name": ".cache/NhwcConv_0-conv_inConv_145.const", - "file_size": 473600 - }, - "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 91053248, - "file_name": ".cache/NhwcConv_0-conv_inConv_146.const", - "file_size": 1280 - }, - "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 91054528, - "file_name": ".cache/NhwcConv_0-conv_inConv_147.const", - "file_size": 1280 - }, - "onnx::MatMul_5749": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 91055808, - "file_name": ".cache/NhwcConv_0-conv_inConv_148.const", - "file_size": 471040 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9.wts9_9": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 91526848, - "file_name": ".cache/NhwcConv_0-conv_inConv_149.const", - "file_size": 128 - }, - "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.wts9_100": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 91526976, - "file_name": 
".cache/NhwcConv_0-conv_inConv_150.const", - "file_size": 128 - }, - "onnx::MatMul_5759_11_0_13": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 91527104, - "file_name": ".cache/NhwcConv_0-conv_inConv_151.const", - "file_size": 473600 - }, - "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 92000704, - "file_name": ".cache/NhwcConv_0-conv_inConv_152.const", - "file_size": 1280 - }, - "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 92001984, - "file_name": ".cache/NhwcConv_0-conv_inConv_153.const", - "file_size": 1280 - }, - "onnx::MatMul_5760_11_0_14_12_3_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 92003264, - "file_name": ".cache/NhwcConv_0-conv_inConv_154.const", - "file_size": 1868800 - }, - "onnx::MatMul_5760_11_0_14_12_3_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 93872064, - "file_name": ".cache/NhwcConv_0-conv_inConv_155.const", - "file_size": 1868800 - }, - "onnx::MatMul_5761_11_0_15": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1884160 - ], - "size_in_bytes": 1884160, - "op_tensor_size": 1884160, - "offset": 95740864, - "file_name": ".cache/NhwcConv_0-conv_inConv_156.const", - "file_size": 1884160 - }, - "NhwcConv_18_weight_NHWC": { - "packed_buffer_label": "const", 
- "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 97625024, - "file_name": ".cache/NhwcConv_0-conv_inConv_157.const", - "file_size": 501760 - }, - "NhwcConv_19_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4249600 - ], - "size_in_bytes": 4249600, - "op_tensor_size": 4249600, - "offset": 98126784, - "file_name": ".cache/NhwcConv_0-conv_inConv_158.const", - "file_size": 4249600 - }, - "GroupNorm_12_wts_6_0_8": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 102376384, - "file_name": ".cache/NhwcConv_0-conv_inConv_159.const", - "file_size": 2560 - }, - "NhwcConv_20_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 8458240 - ], - "size_in_bytes": 8458240, - "op_tensor_size": 8458240, - "offset": 102378944, - "file_name": ".cache/NhwcConv_0-conv_inConv_160.const", - "file_size": 8458240 - }, - "GroupNorm_13_wts_6_0_9": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 110837184, - "file_name": ".cache/NhwcConv_0-conv_inConv_161.const", - "file_size": 5120 - }, - "NhwcConv_21_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 110842304, - "file_name": ".cache/NhwcConv_0-conv_inConv_162.const", - "file_size": 16916480 - }, - "NhwcConv_22_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1003520 - ], - "size_in_bytes": 1003520, - "op_tensor_size": 1003520, - "offset": 127758784, - "file_name": ".cache/NhwcConv_0-conv_inConv_163.const", - 
"file_size": 1003520 - }, - "GroupNorm_14_wts_6_2_4": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 128762304, - "file_name": ".cache/NhwcConv_0-conv_inConv_164.const", - "file_size": 5120 - }, - "NhwcConv_23_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 128767424, - "file_name": ".cache/NhwcConv_0-conv_inConv_165.const", - "file_size": 2007040 - }, - "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 130774464, - "file_name": ".cache/NhwcConv_0-conv_inConv_166.const", - "file_size": 2560 - }, - "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 130777024, - "file_name": ".cache/NhwcConv_0-conv_inConv_167.const", - "file_size": 2560 - }, - "Attention_4_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 130779584, - "file_name": ".cache/NhwcConv_0-conv_inConv_168.const", - "file_size": 1868800 - }, - "Attention_4_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 132648384, - "file_name": ".cache/NhwcConv_0-conv_inConv_169.const", - "file_size": 1868800 - }, - "Attention_4_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - 
"shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 134517184, - "file_name": ".cache/NhwcConv_0-conv_inConv_170.const", - "file_size": 1868800 - }, - "onnx::MatMul_5778_11_0_16": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 136385984, - "file_name": ".cache/NhwcConv_0-conv_inConv_171.const", - "file_size": 1868800 - }, - "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 138254784, - "file_name": ".cache/NhwcConv_0-conv_inConv_172.const", - "file_size": 2560 - }, - "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 138257344, - "file_name": ".cache/NhwcConv_0-conv_inConv_173.const", - "file_size": 2560 - }, - "onnx::MatMul_5779": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 138259904, - "file_name": ".cache/NhwcConv_0-conv_inConv_174.const", - "file_size": 1868800 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12.wts9_12": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 140128704, - "file_name": ".cache/NhwcConv_0-conv_inConv_175.const", - "file_size": 128 - }, - "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.wts9_108": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": 
[ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 140128832, - "file_name": ".cache/NhwcConv_0-conv_inConv_176.const", - "file_size": 128 - }, - "onnx::MatMul_5789_11_0_17": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 140128960, - "file_name": ".cache/NhwcConv_0-conv_inConv_177.const", - "file_size": 1868800 - }, - "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 141997760, - "file_name": ".cache/NhwcConv_0-conv_inConv_178.const", - "file_size": 2560 - }, - "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 142000320, - "file_name": ".cache/NhwcConv_0-conv_inConv_179.const", - "file_size": 2560 - }, - "onnx::MatMul_5790_11_0_18_12_4_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 142002880, - "file_name": ".cache/NhwcConv_0-conv_inConv_180.const", - "file_size": 7475200 - }, - "onnx::MatMul_5790_11_0_18_12_4_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 149478080, - "file_name": ".cache/NhwcConv_0-conv_inConv_181.const", - "file_size": 7475200 - }, - "onnx::MatMul_5791_11_0_19": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 156953280, - "file_name": 
".cache/NhwcConv_0-conv_inConv_182.const", - "file_size": 7475200 - }, - "NhwcConv_24_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 164428480, - "file_name": ".cache/NhwcConv_0-conv_inConv_183.const", - "file_size": 2007040 - }, - "GroupNorm_15_wts_6_0_10": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 166435520, - "file_name": ".cache/NhwcConv_0-conv_inConv_184.const", - "file_size": 5120 - }, - "NhwcConv_25_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 166440640, - "file_name": ".cache/NhwcConv_0-conv_inConv_185.const", - "file_size": 16916480 - }, - "GroupNorm_16_wts_6_0_11": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 183357120, - "file_name": ".cache/NhwcConv_0-conv_inConv_186.const", - "file_size": 5120 - }, - "NhwcConv_26_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 183362240, - "file_name": ".cache/NhwcConv_0-conv_inConv_187.const", - "file_size": 16916480 - }, - "GroupNorm_17_wts_6_2_5": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 200278720, - "file_name": ".cache/NhwcConv_0-conv_inConv_188.const", - "file_size": 5120 - }, - "NhwcConv_27_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - 
"size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 200283840, - "file_name": ".cache/NhwcConv_0-conv_inConv_189.const", - "file_size": 2007040 - }, - "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 202290880, - "file_name": ".cache/NhwcConv_0-conv_inConv_190.const", - "file_size": 2560 - }, - "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 202293440, - "file_name": ".cache/NhwcConv_0-conv_inConv_191.const", - "file_size": 2560 - }, - "Attention_5_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 202296000, - "file_name": ".cache/NhwcConv_0-conv_inConv_192.const", - "file_size": 1868800 - }, - "Attention_5_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 204164800, - "file_name": ".cache/NhwcConv_0-conv_inConv_193.const", - "file_size": 1868800 - }, - "Attention_5_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 206033600, - "file_name": ".cache/NhwcConv_0-conv_inConv_194.const", - "file_size": 1868800 - }, - "onnx::MatMul_5808_11_0_20": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 207902400, - "file_name": 
".cache/NhwcConv_0-conv_inConv_195.const", - "file_size": 1868800 - }, - "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 209771200, - "file_name": ".cache/NhwcConv_0-conv_inConv_196.const", - "file_size": 2560 - }, - "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 209773760, - "file_name": ".cache/NhwcConv_0-conv_inConv_197.const", - "file_size": 2560 - }, - "onnx::MatMul_5809": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 209776320, - "file_name": ".cache/NhwcConv_0-conv_inConv_198.const", - "file_size": 1868800 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15.wts9_15": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 211645120, - "file_name": ".cache/NhwcConv_0-conv_inConv_199.const", - "file_size": 128 - }, - "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.wts9_116": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 211645248, - "file_name": ".cache/NhwcConv_0-conv_inConv_200.const", - "file_size": 128 - }, - "onnx::MatMul_5819_11_0_21": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 211645376, - "file_name": 
".cache/NhwcConv_0-conv_inConv_201.const", - "file_size": 1868800 - }, - "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 213514176, - "file_name": ".cache/NhwcConv_0-conv_inConv_202.const", - "file_size": 2560 - }, - "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 213516736, - "file_name": ".cache/NhwcConv_0-conv_inConv_203.const", - "file_size": 2560 - }, - "onnx::MatMul_5820_11_0_22_12_5_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 213519296, - "file_name": ".cache/NhwcConv_0-conv_inConv_204.const", - "file_size": 7475200 - }, - "onnx::MatMul_5820_11_0_22_12_5_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 220994496, - "file_name": ".cache/NhwcConv_0-conv_inConv_205.const", - "file_size": 7475200 - }, - "onnx::MatMul_5821_11_0_23": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 228469696, - "file_name": ".cache/NhwcConv_0-conv_inConv_206.const", - "file_size": 7475200 - }, - "NhwcConv_28_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 235944896, - "file_name": ".cache/NhwcConv_0-conv_inConv_207.const", - "file_size": 2007040 - }, - "NhwcConv_29_weight_NHWC": { - 
"packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 17244160 - ], - "size_in_bytes": 17244160, - "op_tensor_size": 17244160, - "offset": 237951936, - "file_name": ".cache/NhwcConv_0-conv_inConv_208.const", - "file_size": 17244160 - }, - "GroupNorm_18_wts_6_0_12": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 255196096, - "file_name": ".cache/NhwcConv_0-conv_inConv_209.const", - "file_size": 5120 - }, - "NhwcConv_30_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 255201216, - "file_name": ".cache/NhwcConv_0-conv_inConv_210.const", - "file_size": 16916480 - }, - "GroupNorm_19_wts_6_0_13": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 272117696, - "file_name": ".cache/NhwcConv_0-conv_inConv_211.const", - "file_size": 5120 - }, - "NhwcConv_31_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 272122816, - "file_name": ".cache/NhwcConv_0-conv_inConv_212.const", - "file_size": 16916480 - }, - "GroupNorm_20_wts_6_0_14": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 289039296, - "file_name": ".cache/NhwcConv_0-conv_inConv_213.const", - "file_size": 5120 - }, - "NhwcConv_32_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 289044416, - "file_name": 
".cache/NhwcConv_0-conv_inConv_214.const", - "file_size": 16916480 - }, - "GroupNorm_21_wts_6_0_15": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 305960896, - "file_name": ".cache/NhwcConv_0-conv_inConv_215.const", - "file_size": 5120 - }, - "NhwcConv_33_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 305966016, - "file_name": ".cache/NhwcConv_0-conv_inConv_216.const", - "file_size": 16916480 - }, - "GroupNorm_22_wts_6_0_16": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 322882496, - "file_name": ".cache/NhwcConv_0-conv_inConv_217.const", - "file_size": 5120 - }, - "NhwcConv_34_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 322887616, - "file_name": ".cache/NhwcConv_0-conv_inConv_218.const", - "file_size": 16916480 - }, - "GroupNorm_23_wts_6_0_17": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 339804096, - "file_name": ".cache/NhwcConv_0-conv_inConv_219.const", - "file_size": 5120 - }, - "NhwcConv_35_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 339809216, - "file_name": ".cache/NhwcConv_0-conv_inConv_220.const", - "file_size": 16916480 - }, - "GroupNorm_24_wts_6_2_6": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - 
"size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 356725696, - "file_name": ".cache/NhwcConv_0-conv_inConv_221.const", - "file_size": 5120 - }, - "NhwcConv_36_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2048000 - ], - "size_in_bytes": 2048000, - "op_tensor_size": 2048000, - "offset": 356730816, - "file_name": ".cache/NhwcConv_0-conv_inConv_222.const", - "file_size": 2048000 - }, - "mid_block.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 358778816, - "file_name": ".cache/NhwcConv_0-conv_inConv_223.const", - "file_size": 2560 - }, - "mid_block.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 358781376, - "file_name": ".cache/NhwcConv_0-conv_inConv_224.const", - "file_size": 2560 - }, - "Attention_6_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 358783936, - "file_name": ".cache/NhwcConv_0-conv_inConv_225.const", - "file_size": 1868800 - }, - "Attention_6_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 360652736, - "file_name": ".cache/NhwcConv_0-conv_inConv_226.const", - "file_size": 1868800 - }, - "Attention_6_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 362521536, - "file_name": ".cache/NhwcConv_0-conv_inConv_227.const", - 
"file_size": 1868800 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121.wts9_121": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 364390336, - "file_name": ".cache/NhwcConv_0-conv_inConv_228.const", - "file_size": 128 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120.wts9_120": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 364390464, - "file_name": ".cache/NhwcConv_0-conv_inConv_229.const", - "file_size": 128 - }, - "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122.wts9_122": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 364390592, - "file_name": ".cache/NhwcConv_0-conv_inConv_230.const", - "file_size": 128 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.wts9_123": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 364390720, - "file_name": ".cache/NhwcConv_0-conv_inConv_231.const", - "file_size": 128 - }, - "onnx::MatMul_5846_11_0_24": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 364390848, - "file_name": ".cache/NhwcConv_0-conv_inConv_232.const", - "file_size": 1868800 - }, - "mid_block.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - 
"size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 366259648, - "file_name": ".cache/NhwcConv_0-conv_inConv_233.const", - "file_size": 2560 - }, - "mid_block.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 366262208, - "file_name": ".cache/NhwcConv_0-conv_inConv_234.const", - "file_size": 2560 - }, - "onnx::MatMul_5847": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 366264768, - "file_name": ".cache/NhwcConv_0-conv_inConv_235.const", - "file_size": 1868800 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18.wts9_18": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 368133568, - "file_name": ".cache/NhwcConv_0-conv_inConv_236.const", - "file_size": 128 - }, - "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.wts9_124": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 368133696, - "file_name": ".cache/NhwcConv_0-conv_inConv_237.const", - "file_size": 128 - }, - "onnx::MatMul_5857_11_0_25": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 368133824, - "file_name": ".cache/NhwcConv_0-conv_inConv_238.const", - "file_size": 1868800 - }, - "mid_block.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 
2560, - "offset": 370002624, - "file_name": ".cache/NhwcConv_0-conv_inConv_239.const", - "file_size": 2560 - }, - "mid_block.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 370005184, - "file_name": ".cache/NhwcConv_0-conv_inConv_240.const", - "file_size": 2560 - }, - "onnx::MatMul_5858_11_0_26_12_6_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 370007744, - "file_name": ".cache/NhwcConv_0-conv_inConv_241.const", - "file_size": 7475200 - }, - "onnx::MatMul_5858_11_0_26_12_6_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 377482944, - "file_name": ".cache/NhwcConv_0-conv_inConv_242.const", - "file_size": 7475200 - }, - "onnx::MatMul_5859_11_0_27": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 384958144, - "file_name": ".cache/NhwcConv_0-conv_inConv_243.const", - "file_size": 7475200 - }, - "NhwcConv_37_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2048000 - ], - "size_in_bytes": 2048000, - "op_tensor_size": 2048000, - "offset": 392433344, - "file_name": ".cache/NhwcConv_0-conv_inConv_244.const", - "file_size": 2048000 - }, - "GroupNorm_25_wts_6_0_18": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 394481344, - "file_name": ".cache/NhwcConv_0-conv_inConv_245.const", - "file_size": 5120 - }, - "NhwcConv_38_weight_NHWC": { - 
"packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 394486464, - "file_name": ".cache/NhwcConv_0-conv_inConv_246.const", - "file_size": 16916480 - }, - "GroupNorm_26_wts_6_0_19": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 411402944, - "file_name": ".cache/NhwcConv_0-conv_inConv_247.const", - "file_size": 5120 - }, - "NhwcConv_39_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 411408064, - "file_name": ".cache/NhwcConv_0-conv_inConv_248.const", - "file_size": 16916480 - }, - "GroupNorm_27_wts_6_0_20": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 5120 - ], - "size_in_bytes": 10240, - "op_tensor_size": 10240, - "offset": 428324544, - "file_name": ".cache/NhwcConv_0-conv_inConv_249.const", - "file_size": 10240 - }, - "NhwcConv_40_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 33832960 - ], - "size_in_bytes": 33832960, - "op_tensor_size": 33832960, - "offset": 428334784, - "file_name": ".cache/NhwcConv_0-conv_inConv_250.const", - "file_size": 33832960 - }, - "GroupNorm_28_wts_6_0_21": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 462167744, - "file_name": ".cache/NhwcConv_0-conv_inConv_251.const", - "file_size": 5120 - }, - "NhwcConv_41_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 462172864, - "file_name": 
".cache/NhwcConv_0-conv_inConv_252.const", - "file_size": 16916480 - }, - "NhwcConv_42_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4096000 - ], - "size_in_bytes": 4096000, - "op_tensor_size": 4096000, - "offset": 479089344, - "file_name": ".cache/NhwcConv_0-conv_inConv_253.const", - "file_size": 4096000 - }, - "GroupNorm_29_wts_6_0_22": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 5120 - ], - "size_in_bytes": 10240, - "op_tensor_size": 10240, - "offset": 483185344, - "file_name": ".cache/NhwcConv_0-conv_inConv_254.const", - "file_size": 10240 - }, - "NhwcConv_43_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 33832960 - ], - "size_in_bytes": 33832960, - "op_tensor_size": 33832960, - "offset": 483195584, - "file_name": ".cache/NhwcConv_0-conv_inConv_255.const", - "file_size": 33832960 - }, - "GroupNorm_30_wts_6_0_23": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 517028544, - "file_name": ".cache/NhwcConv_0-conv_inConv_256.const", - "file_size": 5120 - }, - "NhwcConv_44_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 517033664, - "file_name": ".cache/NhwcConv_0-conv_inConv_257.const", - "file_size": 16916480 - }, - "NhwcConv_45_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4096000 - ], - "size_in_bytes": 4096000, - "op_tensor_size": 4096000, - "offset": 533950144, - "file_name": ".cache/NhwcConv_0-conv_inConv_258.const", - "file_size": 4096000 - }, - "GroupNorm_31_wts_6_0_24": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 5120 - 
], - "size_in_bytes": 10240, - "op_tensor_size": 10240, - "offset": 538046144, - "file_name": ".cache/NhwcConv_0-conv_inConv_259.const", - "file_size": 10240 - }, - "NhwcConv_46_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 33832960 - ], - "size_in_bytes": 33832960, - "op_tensor_size": 33832960, - "offset": 538056384, - "file_name": ".cache/NhwcConv_0-conv_inConv_260.const", - "file_size": 33832960 - }, - "GroupNorm_32_wts_6_0_25": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 571889344, - "file_name": ".cache/NhwcConv_0-conv_inConv_261.const", - "file_size": 5120 - }, - "NhwcConv_47_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 571894464, - "file_name": ".cache/NhwcConv_0-conv_inConv_262.const", - "file_size": 16916480 - }, - "NhwcConv_48_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4096000 - ], - "size_in_bytes": 4096000, - "op_tensor_size": 4096000, - "offset": 588810944, - "file_name": ".cache/NhwcConv_0-conv_inConv_263.const", - "file_size": 4096000 - }, - "/up_blocks.0/upsamplers.0/Resize.weights3_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 128 - ], - "size_in_bytes": 256, - "op_tensor_size": 256, - "offset": 592906944, - "file_name": ".cache/NhwcConv_0-conv_inConv_264.const", - "file_size": 256 - }, - "NhwcConv_49_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 592907200, - "file_name": ".cache/NhwcConv_0-conv_inConv_265.const", - "file_size": 16916480 - }, - 
"GroupNorm_33_wts_6_0_26": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 5120 - ], - "size_in_bytes": 10240, - "op_tensor_size": 10240, - "offset": 609823680, - "file_name": ".cache/NhwcConv_0-conv_inConv_266.const", - "file_size": 10240 - }, - "NhwcConv_50_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 33832960 - ], - "size_in_bytes": 33832960, - "op_tensor_size": 33832960, - "offset": 609833920, - "file_name": ".cache/NhwcConv_0-conv_inConv_267.const", - "file_size": 33832960 - }, - "GroupNorm_34_wts_6_0_27": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 643666880, - "file_name": ".cache/NhwcConv_0-conv_inConv_268.const", - "file_size": 5120 - }, - "NhwcConv_51_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 643672000, - "file_name": ".cache/NhwcConv_0-conv_inConv_269.const", - "file_size": 16916480 - }, - "NhwcConv_52_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4014080 - ], - "size_in_bytes": 4014080, - "op_tensor_size": 4014080, - "offset": 660588480, - "file_name": ".cache/NhwcConv_0-conv_inConv_270.const", - "file_size": 4014080 - }, - "GroupNorm_35_wts_6_2_7": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 664602560, - "file_name": ".cache/NhwcConv_0-conv_inConv_271.const", - "file_size": 5120 - }, - "NhwcConv_53_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 664607680, - 
"file_name": ".cache/NhwcConv_0-conv_inConv_272.const", - "file_size": 2007040 - }, - "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 666614720, - "file_name": ".cache/NhwcConv_0-conv_inConv_273.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 666617280, - "file_name": ".cache/NhwcConv_0-conv_inConv_274.const", - "file_size": 2560 - }, - "Attention_7_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 666619840, - "file_name": ".cache/NhwcConv_0-conv_inConv_275.const", - "file_size": 1868800 - }, - "Attention_7_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 668488640, - "file_name": ".cache/NhwcConv_0-conv_inConv_276.const", - "file_size": 1868800 - }, - "Attention_7_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 670357440, - "file_name": ".cache/NhwcConv_0-conv_inConv_277.const", - "file_size": 1868800 - }, - "onnx::MatMul_5893_11_0_28": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 672226240, - "file_name": ".cache/NhwcConv_0-conv_inConv_278.const", - "file_size": 1868800 - }, - 
"up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 674095040, - "file_name": ".cache/NhwcConv_0-conv_inConv_279.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 674097600, - "file_name": ".cache/NhwcConv_0-conv_inConv_280.const", - "file_size": 2560 - }, - "onnx::MatMul_5894": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 674100160, - "file_name": ".cache/NhwcConv_0-conv_inConv_281.const", - "file_size": 1868800 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21.wts9_21": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 675968960, - "file_name": ".cache/NhwcConv_0-conv_inConv_282.const", - "file_size": 128 - }, - "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.wts9_132": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 675969088, - "file_name": ".cache/NhwcConv_0-conv_inConv_283.const", - "file_size": 128 - }, - "onnx::MatMul_5904_11_0_29": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 675969216, - "file_name": ".cache/NhwcConv_0-conv_inConv_284.const", - "file_size": 1868800 - }, - 
"up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 677838016, - "file_name": ".cache/NhwcConv_0-conv_inConv_285.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 677840576, - "file_name": ".cache/NhwcConv_0-conv_inConv_286.const", - "file_size": 2560 - }, - "onnx::MatMul_5905_11_0_30_12_7_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 677843136, - "file_name": ".cache/NhwcConv_0-conv_inConv_287.const", - "file_size": 7475200 - }, - "onnx::MatMul_5905_11_0_30_12_7_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 685318336, - "file_name": ".cache/NhwcConv_0-conv_inConv_288.const", - "file_size": 7475200 - }, - "onnx::MatMul_5906_11_0_31": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 692793536, - "file_name": ".cache/NhwcConv_0-conv_inConv_289.const", - "file_size": 7475200 - }, - "NhwcConv_54_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 700268736, - "file_name": ".cache/NhwcConv_0-conv_inConv_290.const", - "file_size": 2007040 - }, - "GroupNorm_36_wts_6_0_28": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 5120 
- ], - "size_in_bytes": 10240, - "op_tensor_size": 10240, - "offset": 702275776, - "file_name": ".cache/NhwcConv_0-conv_inConv_291.const", - "file_size": 10240 - }, - "NhwcConv_55_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 33832960 - ], - "size_in_bytes": 33832960, - "op_tensor_size": 33832960, - "offset": 702286016, - "file_name": ".cache/NhwcConv_0-conv_inConv_292.const", - "file_size": 33832960 - }, - "GroupNorm_37_wts_6_0_29": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 736118976, - "file_name": ".cache/NhwcConv_0-conv_inConv_293.const", - "file_size": 5120 - }, - "NhwcConv_56_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 736124096, - "file_name": ".cache/NhwcConv_0-conv_inConv_294.const", - "file_size": 16916480 - }, - "NhwcConv_57_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4014080 - ], - "size_in_bytes": 4014080, - "op_tensor_size": 4014080, - "offset": 753040576, - "file_name": ".cache/NhwcConv_0-conv_inConv_295.const", - "file_size": 4014080 - }, - "GroupNorm_38_wts_6_2_8": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 757054656, - "file_name": ".cache/NhwcConv_0-conv_inConv_296.const", - "file_size": 5120 - }, - "NhwcConv_58_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 757059776, - "file_name": ".cache/NhwcConv_0-conv_inConv_297.const", - "file_size": 2007040 - }, - 
"up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 759066816, - "file_name": ".cache/NhwcConv_0-conv_inConv_298.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 759069376, - "file_name": ".cache/NhwcConv_0-conv_inConv_299.const", - "file_size": 2560 - }, - "Attention_8_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 759071936, - "file_name": ".cache/NhwcConv_0-conv_inConv_300.const", - "file_size": 1868800 - }, - "Attention_8_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 760940736, - "file_name": ".cache/NhwcConv_0-conv_inConv_301.const", - "file_size": 1868800 - }, - "Attention_8_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 762809536, - "file_name": ".cache/NhwcConv_0-conv_inConv_302.const", - "file_size": 1868800 - }, - "onnx::MatMul_5923_11_0_32": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 764678336, - "file_name": ".cache/NhwcConv_0-conv_inConv_303.const", - "file_size": 1868800 - }, - "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": 
"bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 766547136, - "file_name": ".cache/NhwcConv_0-conv_inConv_304.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 766549696, - "file_name": ".cache/NhwcConv_0-conv_inConv_305.const", - "file_size": 2560 - }, - "onnx::MatMul_5924": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 766552256, - "file_name": ".cache/NhwcConv_0-conv_inConv_306.const", - "file_size": 1868800 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24.wts9_24": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 768421056, - "file_name": ".cache/NhwcConv_0-conv_inConv_307.const", - "file_size": 128 - }, - "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.wts9_140": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 768421184, - "file_name": ".cache/NhwcConv_0-conv_inConv_308.const", - "file_size": 128 - }, - "onnx::MatMul_5934_11_0_33": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 768421312, - "file_name": ".cache/NhwcConv_0-conv_inConv_309.const", - "file_size": 1868800 - }, - "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - 
], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 770290112, - "file_name": ".cache/NhwcConv_0-conv_inConv_310.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 770292672, - "file_name": ".cache/NhwcConv_0-conv_inConv_311.const", - "file_size": 2560 - }, - "onnx::MatMul_5935_11_0_34_12_8_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 770295232, - "file_name": ".cache/NhwcConv_0-conv_inConv_312.const", - "file_size": 7475200 - }, - "onnx::MatMul_5935_11_0_34_12_8_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 777770432, - "file_name": ".cache/NhwcConv_0-conv_inConv_313.const", - "file_size": 7475200 - }, - "onnx::MatMul_5936_11_0_35": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 785245632, - "file_name": ".cache/NhwcConv_0-conv_inConv_314.const", - "file_size": 7475200 - }, - "NhwcConv_59_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 792720832, - "file_name": ".cache/NhwcConv_0-conv_inConv_315.const", - "file_size": 2007040 - }, - "GroupNorm_39_wts_6_0_30": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 3840 - ], - "size_in_bytes": 7680, - "op_tensor_size": 7680, - "offset": 794727872, - "file_name": ".cache/NhwcConv_0-conv_inConv_316.const", - "file_size": 7680 - }, 
- "NhwcConv_60_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 25374720 - ], - "size_in_bytes": 25374720, - "op_tensor_size": 25374720, - "offset": 794735552, - "file_name": ".cache/NhwcConv_0-conv_inConv_317.const", - "file_size": 25374720 - }, - "GroupNorm_40_wts_6_0_31": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 820110272, - "file_name": ".cache/NhwcConv_0-conv_inConv_318.const", - "file_size": 5120 - }, - "NhwcConv_61_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 16916480 - ], - "size_in_bytes": 16916480, - "op_tensor_size": 16916480, - "offset": 820115392, - "file_name": ".cache/NhwcConv_0-conv_inConv_319.const", - "file_size": 16916480 - }, - "NhwcConv_62_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 3010560 - ], - "size_in_bytes": 3010560, - "op_tensor_size": 3010560, - "offset": 837031872, - "file_name": ".cache/NhwcConv_0-conv_inConv_320.const", - "file_size": 3010560 - }, - "GroupNorm_41_wts_6_2_9": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 840042432, - "file_name": ".cache/NhwcConv_0-conv_inConv_321.const", - "file_size": 5120 - }, - "NhwcConv_63_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 840047552, - "file_name": ".cache/NhwcConv_0-conv_inConv_322.const", - "file_size": 2007040 - }, - "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - 
"op_tensor_size": 2560, - "offset": 842054592, - "file_name": ".cache/NhwcConv_0-conv_inConv_323.const", - "file_size": 2560 - }, - "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 842057152, - "file_name": ".cache/NhwcConv_0-conv_inConv_324.const", - "file_size": 2560 - }, - "Attention_9_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 842059712, - "file_name": ".cache/NhwcConv_0-conv_inConv_325.const", - "file_size": 1868800 - }, - "Attention_9_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 843928512, - "file_name": ".cache/NhwcConv_0-conv_inConv_326.const", - "file_size": 1868800 - }, - "Attention_9_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 845797312, - "file_name": ".cache/NhwcConv_0-conv_inConv_327.const", - "file_size": 1868800 - }, - "onnx::MatMul_5953_11_0_36": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 847666112, - "file_name": ".cache/NhwcConv_0-conv_inConv_328.const", - "file_size": 1868800 - }, - "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 849534912, - "file_name": ".cache/NhwcConv_0-conv_inConv_329.const", - "file_size": 2560 - }, 
- "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 849537472, - "file_name": ".cache/NhwcConv_0-conv_inConv_330.const", - "file_size": 2560 - }, - "onnx::MatMul_5954": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 849540032, - "file_name": ".cache/NhwcConv_0-conv_inConv_331.const", - "file_size": 1868800 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27.wts9_27": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 851408832, - "file_name": ".cache/NhwcConv_0-conv_inConv_332.const", - "file_size": 128 - }, - "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.wts9_148": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 851408960, - "file_name": ".cache/NhwcConv_0-conv_inConv_333.const", - "file_size": 128 - }, - "onnx::MatMul_5964_11_0_37": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 851409088, - "file_name": ".cache/NhwcConv_0-conv_inConv_334.const", - "file_size": 1868800 - }, - "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 853277888, - "file_name": ".cache/NhwcConv_0-conv_inConv_335.const", - "file_size": 2560 - }, - 
"up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 853280448, - "file_name": ".cache/NhwcConv_0-conv_inConv_336.const", - "file_size": 2560 - }, - "onnx::MatMul_5965_11_0_38_12_9_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 853283008, - "file_name": ".cache/NhwcConv_0-conv_inConv_337.const", - "file_size": 7475200 - }, - "onnx::MatMul_5965_11_0_38_12_9_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 860758208, - "file_name": ".cache/NhwcConv_0-conv_inConv_338.const", - "file_size": 7475200 - }, - "onnx::MatMul_5966_11_0_39": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 7475200 - ], - "size_in_bytes": 7475200, - "op_tensor_size": 7475200, - "offset": 868233408, - "file_name": ".cache/NhwcConv_0-conv_inConv_339.const", - "file_size": 7475200 - }, - "NhwcConv_64_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2007040 - ], - "size_in_bytes": 2007040, - "op_tensor_size": 2007040, - "offset": 875708608, - "file_name": ".cache/NhwcConv_0-conv_inConv_340.const", - "file_size": 2007040 - }, - "/up_blocks.1/upsamplers.0/Resize.weights3_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 128 - ], - "size_in_bytes": 256, - "op_tensor_size": 256, - "offset": 877715648, - "file_name": ".cache/NhwcConv_0-conv_inConv_341.const", - "file_size": 256 - }, - "NhwcConv_65_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 17244160 - ], - 
"size_in_bytes": 17244160, - "op_tensor_size": 17244160, - "offset": 877715904, - "file_name": ".cache/NhwcConv_0-conv_inConv_342.const", - "file_size": 17244160 - }, - "GroupNorm_42_wts_6_0_32": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 3840 - ], - "size_in_bytes": 7680, - "op_tensor_size": 7680, - "offset": 894960064, - "file_name": ".cache/NhwcConv_0-conv_inConv_343.const", - "file_size": 7680 - }, - "NhwcConv_66_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 12851200 - ], - "size_in_bytes": 12851200, - "op_tensor_size": 12851200, - "offset": 894967744, - "file_name": ".cache/NhwcConv_0-conv_inConv_344.const", - "file_size": 12851200 - }, - "GroupNorm_43_wts_6_0_33": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 907818944, - "file_name": ".cache/NhwcConv_0-conv_inConv_345.const", - "file_size": 2560 - }, - "NhwcConv_67_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - "size_in_bytes": 4311040, - "op_tensor_size": 4311040, - "offset": 907821504, - "file_name": ".cache/NhwcConv_0-conv_inConv_346.const", - "file_size": 4311040 - }, - "NhwcConv_68_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1505280 - ], - "size_in_bytes": 1505280, - "op_tensor_size": 1505280, - "offset": 912132544, - "file_name": ".cache/NhwcConv_0-conv_inConv_347.const", - "file_size": 1505280 - }, - "GroupNorm_44_wts_6_2_10": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 913637824, - "file_name": ".cache/NhwcConv_0-conv_inConv_348.const", - "file_size": 2560 - }, - "NhwcConv_69_weight_NHWC": { - "packed_buffer_label": 
"const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 913640384, - "file_name": ".cache/NhwcConv_0-conv_inConv_349.const", - "file_size": 501760 - }, - "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 914142144, - "file_name": ".cache/NhwcConv_0-conv_inConv_350.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 914143424, - "file_name": ".cache/NhwcConv_0-conv_inConv_351.const", - "file_size": 1280 - }, - "Attention_10_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 914144704, - "file_name": ".cache/NhwcConv_0-conv_inConv_352.const", - "file_size": 471040 - }, - "Attention_10_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 914615744, - "file_name": ".cache/NhwcConv_0-conv_inConv_353.const", - "file_size": 471040 - }, - "Attention_10_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 915086784, - "file_name": ".cache/NhwcConv_0-conv_inConv_354.const", - "file_size": 471040 - }, - "onnx::MatMul_5984_11_0_40": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 
915557824, - "file_name": ".cache/NhwcConv_0-conv_inConv_355.const", - "file_size": 473600 - }, - "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 916031424, - "file_name": ".cache/NhwcConv_0-conv_inConv_356.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 916032704, - "file_name": ".cache/NhwcConv_0-conv_inConv_357.const", - "file_size": 1280 - }, - "onnx::MatMul_5985": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 916033984, - "file_name": ".cache/NhwcConv_0-conv_inConv_358.const", - "file_size": 471040 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30.wts9_30": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 916505024, - "file_name": ".cache/NhwcConv_0-conv_inConv_359.const", - "file_size": 128 - }, - "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.wts9_156": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 916505152, - "file_name": ".cache/NhwcConv_0-conv_inConv_360.const", - "file_size": 128 - }, - "onnx::MatMul_5995_11_0_41": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 916505280, - "file_name": 
".cache/NhwcConv_0-conv_inConv_361.const", - "file_size": 473600 - }, - "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 916978880, - "file_name": ".cache/NhwcConv_0-conv_inConv_362.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 916980160, - "file_name": ".cache/NhwcConv_0-conv_inConv_363.const", - "file_size": 1280 - }, - "onnx::MatMul_5996_11_0_42_12_10_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 916981440, - "file_name": ".cache/NhwcConv_0-conv_inConv_364.const", - "file_size": 1868800 - }, - "onnx::MatMul_5996_11_0_42_12_10_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 918850240, - "file_name": ".cache/NhwcConv_0-conv_inConv_365.const", - "file_size": 1868800 - }, - "onnx::MatMul_5997_11_0_43": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1884160 - ], - "size_in_bytes": 1884160, - "op_tensor_size": 1884160, - "offset": 920719040, - "file_name": ".cache/NhwcConv_0-conv_inConv_366.const", - "file_size": 1884160 - }, - "NhwcConv_70_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 922603200, - "file_name": ".cache/NhwcConv_0-conv_inConv_367.const", - "file_size": 501760 - }, - "GroupNorm_45_wts_6_0_34": { - "packed_buffer_label": 
"const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 2560 - ], - "size_in_bytes": 5120, - "op_tensor_size": 5120, - "offset": 923104960, - "file_name": ".cache/NhwcConv_0-conv_inConv_368.const", - "file_size": 5120 - }, - "NhwcConv_71_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 8622080 - ], - "size_in_bytes": 8622080, - "op_tensor_size": 8622080, - "offset": 923110080, - "file_name": ".cache/NhwcConv_0-conv_inConv_369.const", - "file_size": 8622080 - }, - "GroupNorm_46_wts_6_0_35": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 931732160, - "file_name": ".cache/NhwcConv_0-conv_inConv_370.const", - "file_size": 2560 - }, - "NhwcConv_72_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - "size_in_bytes": 4311040, - "op_tensor_size": 4311040, - "offset": 931734720, - "file_name": ".cache/NhwcConv_0-conv_inConv_371.const", - "file_size": 4311040 - }, - "NhwcConv_73_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1003520 - ], - "size_in_bytes": 1003520, - "op_tensor_size": 1003520, - "offset": 936045760, - "file_name": ".cache/NhwcConv_0-conv_inConv_372.const", - "file_size": 1003520 - }, - "GroupNorm_47_wts_6_2_11": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 937049280, - "file_name": ".cache/NhwcConv_0-conv_inConv_373.const", - "file_size": 2560 - }, - "NhwcConv_74_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 937051840, - "file_name": ".cache/NhwcConv_0-conv_inConv_374.const", - 
"file_size": 501760 - }, - "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 937553600, - "file_name": ".cache/NhwcConv_0-conv_inConv_375.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 937554880, - "file_name": ".cache/NhwcConv_0-conv_inConv_376.const", - "file_size": 1280 - }, - "Attention_11_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 937556160, - "file_name": ".cache/NhwcConv_0-conv_inConv_377.const", - "file_size": 471040 - }, - "Attention_11_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 938027200, - "file_name": ".cache/NhwcConv_0-conv_inConv_378.const", - "file_size": 471040 - }, - "Attention_11_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 938498240, - "file_name": ".cache/NhwcConv_0-conv_inConv_379.const", - "file_size": 471040 - }, - "onnx::MatMul_6014_11_0_44": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 938969280, - "file_name": ".cache/NhwcConv_0-conv_inConv_380.const", - "file_size": 473600 - }, - "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - 
"dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 939442880, - "file_name": ".cache/NhwcConv_0-conv_inConv_381.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 939444160, - "file_name": ".cache/NhwcConv_0-conv_inConv_382.const", - "file_size": 1280 - }, - "onnx::MatMul_6015": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 939445440, - "file_name": ".cache/NhwcConv_0-conv_inConv_383.const", - "file_size": 471040 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33.wts9_33": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 939916480, - "file_name": ".cache/NhwcConv_0-conv_inConv_384.const", - "file_size": 128 - }, - "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.wts9_164": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 939916608, - "file_name": ".cache/NhwcConv_0-conv_inConv_385.const", - "file_size": 128 - }, - "onnx::MatMul_6025_11_0_45": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 939916736, - "file_name": ".cache/NhwcConv_0-conv_inConv_386.const", - "file_size": 473600 - }, - "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], 
- "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 940390336, - "file_name": ".cache/NhwcConv_0-conv_inConv_387.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 940391616, - "file_name": ".cache/NhwcConv_0-conv_inConv_388.const", - "file_size": 1280 - }, - "onnx::MatMul_6026_11_0_46_12_11_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 940392896, - "file_name": ".cache/NhwcConv_0-conv_inConv_389.const", - "file_size": 1868800 - }, - "onnx::MatMul_6026_11_0_46_12_11_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 942261696, - "file_name": ".cache/NhwcConv_0-conv_inConv_390.const", - "file_size": 1868800 - }, - "onnx::MatMul_6027_11_0_47": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1884160 - ], - "size_in_bytes": 1884160, - "op_tensor_size": 1884160, - "offset": 944130496, - "file_name": ".cache/NhwcConv_0-conv_inConv_391.const", - "file_size": 1884160 - }, - "NhwcConv_75_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 946014656, - "file_name": ".cache/NhwcConv_0-conv_inConv_392.const", - "file_size": 501760 - }, - "GroupNorm_48_wts_6_0_36": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1920 - ], - "size_in_bytes": 3840, - "op_tensor_size": 3840, - "offset": 946516416, - "file_name": ".cache/NhwcConv_0-conv_inConv_393.const", - "file_size": 3840 - }, - 
"NhwcConv_76_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 6425600 - ], - "size_in_bytes": 6425600, - "op_tensor_size": 6425600, - "offset": 946520256, - "file_name": ".cache/NhwcConv_0-conv_inConv_394.const", - "file_size": 6425600 - }, - "GroupNorm_49_wts_6_0_37": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 952945856, - "file_name": ".cache/NhwcConv_0-conv_inConv_395.const", - "file_size": 2560 - }, - "NhwcConv_77_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - "size_in_bytes": 4311040, - "op_tensor_size": 4311040, - "offset": 952948416, - "file_name": ".cache/NhwcConv_0-conv_inConv_396.const", - "file_size": 4311040 - }, - "NhwcConv_78_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 752640 - ], - "size_in_bytes": 752640, - "op_tensor_size": 752640, - "offset": 957259456, - "file_name": ".cache/NhwcConv_0-conv_inConv_397.const", - "file_size": 752640 - }, - "GroupNorm_50_wts_6_2_12": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 958012096, - "file_name": ".cache/NhwcConv_0-conv_inConv_398.const", - "file_size": 2560 - }, - "NhwcConv_79_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 958014656, - "file_name": ".cache/NhwcConv_0-conv_inConv_399.const", - "file_size": 501760 - }, - "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - 
"offset": 958516416, - "file_name": ".cache/NhwcConv_0-conv_inConv_400.const", - "file_size": 1280 - }, - "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 958517696, - "file_name": ".cache/NhwcConv_0-conv_inConv_401.const", - "file_size": 1280 - }, - "Attention_12_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 958518976, - "file_name": ".cache/NhwcConv_0-conv_inConv_402.const", - "file_size": 471040 - }, - "Attention_12_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 958990016, - "file_name": ".cache/NhwcConv_0-conv_inConv_403.const", - "file_size": 471040 - }, - "Attention_12_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 959461056, - "file_name": ".cache/NhwcConv_0-conv_inConv_404.const", - "file_size": 471040 - }, - "onnx::MatMul_6044_11_0_48": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 959932096, - "file_name": ".cache/NhwcConv_0-conv_inConv_405.const", - "file_size": 473600 - }, - "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 960405696, - "file_name": ".cache/NhwcConv_0-conv_inConv_406.const", - "file_size": 1280 - }, - 
"up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 960406976, - "file_name": ".cache/NhwcConv_0-conv_inConv_407.const", - "file_size": 1280 - }, - "onnx::MatMul_6045": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 960408256, - "file_name": ".cache/NhwcConv_0-conv_inConv_408.const", - "file_size": 471040 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36.wts9_36": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 960879296, - "file_name": ".cache/NhwcConv_0-conv_inConv_409.const", - "file_size": 128 - }, - "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.wts9_172": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 960879424, - "file_name": ".cache/NhwcConv_0-conv_inConv_410.const", - "file_size": 128 - }, - "onnx::MatMul_6055_11_0_49": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 473600 - ], - "size_in_bytes": 473600, - "op_tensor_size": 473600, - "offset": 960879552, - "file_name": ".cache/NhwcConv_0-conv_inConv_411.const", - "file_size": 473600 - }, - "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 961353152, - "file_name": ".cache/NhwcConv_0-conv_inConv_412.const", - "file_size": 1280 - }, - 
"up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 961354432, - "file_name": ".cache/NhwcConv_0-conv_inConv_413.const", - "file_size": 1280 - }, - "onnx::MatMul_6056_11_0_50_12_12_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 961355712, - "file_name": ".cache/NhwcConv_0-conv_inConv_414.const", - "file_size": 1868800 - }, - "onnx::MatMul_6056_11_0_50_12_12_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1868800 - ], - "size_in_bytes": 1868800, - "op_tensor_size": 1868800, - "offset": 963224512, - "file_name": ".cache/NhwcConv_0-conv_inConv_415.const", - "file_size": 1868800 - }, - "onnx::MatMul_6057_11_0_51": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1884160 - ], - "size_in_bytes": 1884160, - "op_tensor_size": 1884160, - "offset": 965093312, - "file_name": ".cache/NhwcConv_0-conv_inConv_416.const", - "file_size": 1884160 - }, - "NhwcConv_80_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 501760 - ], - "size_in_bytes": 501760, - "op_tensor_size": 501760, - "offset": 966977472, - "file_name": ".cache/NhwcConv_0-conv_inConv_417.const", - "file_size": 501760 - }, - "/up_blocks.2/upsamplers.0/Resize.weights3_2": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 128 - ], - "size_in_bytes": 256, - "op_tensor_size": 256, - "offset": 967479232, - "file_name": ".cache/NhwcConv_0-conv_inConv_418.const", - "file_size": 256 - }, - "NhwcConv_81_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 4311040 - ], - 
"size_in_bytes": 4311040, - "op_tensor_size": 4311040, - "offset": 967479488, - "file_name": ".cache/NhwcConv_0-conv_inConv_419.const", - "file_size": 4311040 - }, - "GroupNorm_51_wts_6_0_38": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1920 - ], - "size_in_bytes": 3840, - "op_tensor_size": 3840, - "offset": 971790528, - "file_name": ".cache/NhwcConv_0-conv_inConv_420.const", - "file_size": 3840 - }, - "NhwcConv_82_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 3212800 - ], - "size_in_bytes": 3212800, - "op_tensor_size": 3212800, - "offset": 971794368, - "file_name": ".cache/NhwcConv_0-conv_inConv_421.const", - "file_size": 3212800 - }, - "GroupNorm_52_wts_6_0_39": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 975007168, - "file_name": ".cache/NhwcConv_0-conv_inConv_422.const", - "file_size": 1280 - }, - "NhwcConv_83_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 975008448, - "file_name": ".cache/NhwcConv_0-conv_inConv_423.const", - "file_size": 1077760 - }, - "NhwcConv_84_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 376320 - ], - "size_in_bytes": 376320, - "op_tensor_size": 376320, - "offset": 976086208, - "file_name": ".cache/NhwcConv_0-conv_inConv_424.const", - "file_size": 376320 - }, - "GroupNorm_53_wts_6_2_13": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 976462528, - "file_name": ".cache/NhwcConv_0-conv_inConv_425.const", - "file_size": 1280 - }, - "NhwcConv_85_weight_NHWC": { - "packed_buffer_label": "const", - 
"xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 976463808, - "file_name": ".cache/NhwcConv_0-conv_inConv_426.const", - "file_size": 125440 - }, - "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 976589248, - "file_name": ".cache/NhwcConv_0-conv_inConv_427.const", - "file_size": 640 - }, - "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 976589888, - "file_name": ".cache/NhwcConv_0-conv_inConv_428.const", - "file_size": 640 - }, - "Attention_13_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 976590528, - "file_name": ".cache/NhwcConv_0-conv_inConv_429.const", - "file_size": 118400 - }, - "Attention_13_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 976708928, - "file_name": ".cache/NhwcConv_0-conv_inConv_430.const", - "file_size": 118400 - }, - "Attention_13_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 976827328, - "file_name": ".cache/NhwcConv_0-conv_inConv_431.const", - "file_size": 118400 - }, - "onnx::MatMul_6075_11_0_52": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 976945728, - 
"file_name": ".cache/NhwcConv_0-conv_inConv_432.const", - "file_size": 117760 - }, - "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 977063488, - "file_name": ".cache/NhwcConv_0-conv_inConv_433.const", - "file_size": 640 - }, - "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 977064128, - "file_name": ".cache/NhwcConv_0-conv_inConv_434.const", - "file_size": 640 - }, - "onnx::MatMul_6076": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 977064768, - "file_name": ".cache/NhwcConv_0-conv_inConv_435.const", - "file_size": 118400 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39.wts9_39": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 977183168, - "file_name": ".cache/NhwcConv_0-conv_inConv_436.const", - "file_size": 128 - }, - "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.wts9_180": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 977183296, - "file_name": ".cache/NhwcConv_0-conv_inConv_437.const", - "file_size": 128 - }, - "onnx::MatMul_6086_11_0_53": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 977183424, - "file_name": 
".cache/NhwcConv_0-conv_inConv_438.const", - "file_size": 117760 - }, - "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 977301184, - "file_name": ".cache/NhwcConv_0-conv_inConv_439.const", - "file_size": 640 - }, - "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 977301824, - "file_name": ".cache/NhwcConv_0-conv_inConv_440.const", - "file_size": 640 - }, - "onnx::MatMul_6087_11_0_54_12_13_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 977302464, - "file_name": ".cache/NhwcConv_0-conv_inConv_441.const", - "file_size": 471040 - }, - "onnx::MatMul_6087_11_0_54_12_13_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 977773504, - "file_name": ".cache/NhwcConv_0-conv_inConv_442.const", - "file_size": 471040 - }, - "onnx::MatMul_6088_11_0_55": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 978244544, - "file_name": ".cache/NhwcConv_0-conv_inConv_443.const", - "file_size": 471040 - }, - "NhwcConv_86_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 978715584, - "file_name": ".cache/NhwcConv_0-conv_inConv_444.const", - "file_size": 125440 - }, - "GroupNorm_54_wts_6_0_40": { - "packed_buffer_label": "const", - 
"xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 978841024, - "file_name": ".cache/NhwcConv_0-conv_inConv_445.const", - "file_size": 2560 - }, - "NhwcConv_87_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2155520 - ], - "size_in_bytes": 2155520, - "op_tensor_size": 2155520, - "offset": 978843584, - "file_name": ".cache/NhwcConv_0-conv_inConv_446.const", - "file_size": 2155520 - }, - "GroupNorm_55_wts_6_0_41": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 980999104, - "file_name": ".cache/NhwcConv_0-conv_inConv_447.const", - "file_size": 1280 - }, - "NhwcConv_88_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 981000384, - "file_name": ".cache/NhwcConv_0-conv_inConv_448.const", - "file_size": 1077760 - }, - "NhwcConv_89_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 250880 - ], - "size_in_bytes": 250880, - "op_tensor_size": 250880, - "offset": 982078144, - "file_name": ".cache/NhwcConv_0-conv_inConv_449.const", - "file_size": 250880 - }, - "GroupNorm_56_wts_6_2_14": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 982329024, - "file_name": ".cache/NhwcConv_0-conv_inConv_450.const", - "file_size": 1280 - }, - "NhwcConv_90_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 982330304, - "file_name": ".cache/NhwcConv_0-conv_inConv_451.const", - "file_size": 125440 - }, - 
"up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 982455744, - "file_name": ".cache/NhwcConv_0-conv_inConv_452.const", - "file_size": 640 - }, - "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 982456384, - "file_name": ".cache/NhwcConv_0-conv_inConv_453.const", - "file_size": 640 - }, - "Attention_14_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 982457024, - "file_name": ".cache/NhwcConv_0-conv_inConv_454.const", - "file_size": 118400 - }, - "Attention_14_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 982575424, - "file_name": ".cache/NhwcConv_0-conv_inConv_455.const", - "file_size": 118400 - }, - "Attention_14_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 982693824, - "file_name": ".cache/NhwcConv_0-conv_inConv_456.const", - "file_size": 118400 - }, - "onnx::MatMul_6105_11_0_56": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 982812224, - "file_name": ".cache/NhwcConv_0-conv_inConv_457.const", - "file_size": 117760 - }, - "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": 
[ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 982929984, - "file_name": ".cache/NhwcConv_0-conv_inConv_458.const", - "file_size": 640 - }, - "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 982930624, - "file_name": ".cache/NhwcConv_0-conv_inConv_459.const", - "file_size": 640 - }, - "onnx::MatMul_6106": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 982931264, - "file_name": ".cache/NhwcConv_0-conv_inConv_460.const", - "file_size": 118400 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42.wts9_42": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 983049664, - "file_name": ".cache/NhwcConv_0-conv_inConv_461.const", - "file_size": 128 - }, - "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.wts9_188": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 983049792, - "file_name": ".cache/NhwcConv_0-conv_inConv_462.const", - "file_size": 128 - }, - "onnx::MatMul_6116_11_0_57": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 983049920, - "file_name": ".cache/NhwcConv_0-conv_inConv_463.const", - "file_size": 117760 - }, - "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - 
"op_tensor_size": 640, - "offset": 983167680, - "file_name": ".cache/NhwcConv_0-conv_inConv_464.const", - "file_size": 640 - }, - "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 983168320, - "file_name": ".cache/NhwcConv_0-conv_inConv_465.const", - "file_size": 640 - }, - "onnx::MatMul_6117_11_0_58_12_14_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 983168960, - "file_name": ".cache/NhwcConv_0-conv_inConv_466.const", - "file_size": 471040 - }, - "onnx::MatMul_6117_11_0_58_12_14_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 983640000, - "file_name": ".cache/NhwcConv_0-conv_inConv_467.const", - "file_size": 471040 - }, - "onnx::MatMul_6118_11_0_59": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 984111040, - "file_name": ".cache/NhwcConv_0-conv_inConv_468.const", - "file_size": 471040 - }, - "NhwcConv_91_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 984582080, - "file_name": ".cache/NhwcConv_0-conv_inConv_469.const", - "file_size": 125440 - }, - "GroupNorm_57_wts_6_0_42": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 1280 - ], - "size_in_bytes": 2560, - "op_tensor_size": 2560, - "offset": 984707520, - "file_name": ".cache/NhwcConv_0-conv_inConv_470.const", - "file_size": 2560 - }, - "NhwcConv_92_weight_NHWC": { - 
"packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 2155520 - ], - "size_in_bytes": 2155520, - "op_tensor_size": 2155520, - "offset": 984710080, - "file_name": ".cache/NhwcConv_0-conv_inConv_471.const", - "file_size": 2155520 - }, - "GroupNorm_58_wts_6_0_43": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 986865600, - "file_name": ".cache/NhwcConv_0-conv_inConv_472.const", - "file_size": 1280 - }, - "NhwcConv_93_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 1077760 - ], - "size_in_bytes": 1077760, - "op_tensor_size": 1077760, - "offset": 986866880, - "file_name": ".cache/NhwcConv_0-conv_inConv_473.const", - "file_size": 1077760 - }, - "NhwcConv_94_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 250880 - ], - "size_in_bytes": 250880, - "op_tensor_size": 250880, - "offset": 987944640, - "file_name": ".cache/NhwcConv_0-conv_inConv_474.const", - "file_size": 250880 - }, - "GroupNorm_59_wts_6_2_15": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 988195520, - "file_name": ".cache/NhwcConv_0-conv_inConv_475.const", - "file_size": 1280 - }, - "NhwcConv_95_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 988196800, - "file_name": ".cache/NhwcConv_0-conv_inConv_476.const", - "file_size": 125440 - }, - "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 988322240, - "file_name": 
".cache/NhwcConv_0-conv_inConv_477.const", - "file_size": 640 - }, - "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 988322880, - "file_name": ".cache/NhwcConv_0-conv_inConv_478.const", - "file_size": 640 - }, - "Attention_15_qkv_weight_key": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 988323520, - "file_name": ".cache/NhwcConv_0-conv_inConv_479.const", - "file_size": 118400 - }, - "Attention_15_qkv_weight_query": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 988441920, - "file_name": ".cache/NhwcConv_0-conv_inConv_480.const", - "file_size": 118400 - }, - "Attention_15_qkv_weight_value": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 988560320, - "file_name": ".cache/NhwcConv_0-conv_inConv_481.const", - "file_size": 118400 - }, - "onnx::MatMul_6135_11_0_60": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 988678720, - "file_name": ".cache/NhwcConv_0-conv_inConv_482.const", - "file_size": 117760 - }, - "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 988796480, - "file_name": ".cache/NhwcConv_0-conv_inConv_483.const", - "file_size": 640 - }, - "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias": { - 
"packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 988797120, - "file_name": ".cache/NhwcConv_0-conv_inConv_484.const", - "file_size": 640 - }, - "onnx::MatMul_6136": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 118400 - ], - "size_in_bytes": 118400, - "op_tensor_size": 118400, - "offset": 988797760, - "file_name": ".cache/NhwcConv_0-conv_inConv_485.const", - "file_size": 118400 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45.wts9_45": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 988916160, - "file_name": ".cache/NhwcConv_0-conv_inConv_486.const", - "file_size": 128 - }, - "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.wts9_196": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 988916288, - "file_name": ".cache/NhwcConv_0-conv_inConv_487.const", - "file_size": 128 - }, - "onnx::MatMul_6146_11_0_61": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 117760 - ], - "size_in_bytes": 117760, - "op_tensor_size": 117760, - "offset": 988916416, - "file_name": ".cache/NhwcConv_0-conv_inConv_488.const", - "file_size": 117760 - }, - "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 989034176, - "file_name": ".cache/NhwcConv_0-conv_inConv_489.const", - "file_size": 640 - }, - "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, 
- "dtype": "bfloat16", - "shape": [ - 320 - ], - "size_in_bytes": 640, - "op_tensor_size": 640, - "offset": 989034816, - "file_name": ".cache/NhwcConv_0-conv_inConv_490.const", - "file_size": 640 - }, - "onnx::MatMul_6147_11_0_62_12_15_0": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 989035456, - "file_name": ".cache/NhwcConv_0-conv_inConv_491.const", - "file_size": 471040 - }, - "onnx::MatMul_6147_11_0_62_12_15_1": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 989506496, - "file_name": ".cache/NhwcConv_0-conv_inConv_492.const", - "file_size": 471040 - }, - "onnx::MatMul_6148_11_0_63": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 471040 - ], - "size_in_bytes": 471040, - "op_tensor_size": 471040, - "offset": 989977536, - "file_name": ".cache/NhwcConv_0-conv_inConv_493.const", - "file_size": 471040 - }, - "NhwcConv_96_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 125440 - ], - "size_in_bytes": 125440, - "op_tensor_size": 125440, - "offset": 990448576, - "file_name": ".cache/NhwcConv_0-conv_inConv_494.const", - "file_size": 125440 - }, - "GroupNorm_60_wts_6_0_44": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 640 - ], - "size_in_bytes": 1280, - "op_tensor_size": 1280, - "offset": 990574016, - "file_name": ".cache/NhwcConv_0-conv_inConv_495.const", - "file_size": 1280 - }, - "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_bfp.wts7_60": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfloat16", - "shape": [ - 64 - ], - "size_in_bytes": 128, - "op_tensor_size": 128, - "offset": 990575296, - "file_name": ".cache/NhwcConv_0-conv_inConv_496.const", - 
"file_size": 128 - }, - "NhwcConv_97_weight_NHWC": { - "packed_buffer_label": "const", - "xrt_arg_id": 3, - "dtype": "bfp16ebs8", - "shape": [ - 54400 - ], - "size_in_bytes": 54400, - "op_tensor_size": 54400, - "offset": 990575424, - "file_name": ".cache/NhwcConv_0-conv_inConv_497.const", - "file_size": 54400 - } - }, - "aux_info": {} +{ + "dd_meta_major_version": 1, + "dd_meta_minor_version": 4, + "state_table_updates": [], + "op_list": [ + { + "name": "NhwcConv_0-/conv_in/Conv", + "type": "SDConv", + "in_args": [ + "Transpose_44_out-sample.out0_1_0" + ], + "const_args": [ + "NhwcConv_0_weight_NHWC" + ], + "out_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "4" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "4" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0" + ], + "const_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.wts" + ], + "out_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0" + ], + "attrs": { + "input_shape": { + "type": "int", + 
"value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_0", + "type": "SDGroupNorm_bfp", + "in_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0" + ], + "const_args": [ + "GroupNorm_0_wts_6_0_0" + ], + "out_args": [ + "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5660" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": 
"int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5661" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5690" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + 
"value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5691" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5720" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ 
+ "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5721" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5750" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + 
"77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5751" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5780" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + 
"1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5781" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5810" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" 
+ ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5811" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5848" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + 
"weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5849" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/time_embedding/linear_1/Gemm", + "type": "SDGemm", + "in_args": [ + "/time_proj/Concat_1_output_0.out2_3_0" + ], + "const_args": [ + "time_embedding.linear_1.weight_11_1_0" + ], + "out_args": [ + "/time_embedding/linear_1/Gemm_output_0.out2_3_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + 
"1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid", + "type": "SDSilu", + "in_args": [ + "/time_embedding/linear_1/Gemm_output_0.out2_3_0" + ], + "const_args": [ + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid.weights14_0" + ], + "out_args": [ + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/time_embedding/linear_2/Gemm", + "type": "SDGemm", + "in_args": [ + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0" + ], + "const_args": [ + "time_embedding.linear_2.weight_11_1_1" + ], + "out_args": [ + "/time_embedding/linear_2/Gemm_output_0.out2_3_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": 
"/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid", + "type": "SDSilu", + "in_args": [ + "/time_embedding/linear_2/Gemm_output_0.out2_3_1" + ], + "const_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid.weights14_1" + ], + "out_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.0.resnets.0.time_emb_proj.weight_11_1_2" + ], + "out_args": [ + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_1-/down_blocks.0/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0" + ], + "const_args": [ + "NhwcConv_1_weight_NHWC" + ], + "out_args": [ + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1" + ], + "attrs": 
{ + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1", + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_1", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0" + ], + "const_args": [ + "GroupNorm_1_wts_6_0_1" + ], + 
"out_args": [ + "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_2-/down_blocks.0/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1" + ], + "const_args": [ + "NhwcConv_2_weight_NHWC" + ], + "out_args": [ + "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + 
"320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0", + "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_2", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1" + ], + "const_args": [ + "GroupNorm_2_wts_6_2_0" + ], + "out_args": [ + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + 
"value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_3-/down_blocks.0/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2" + ], + "const_args": [ + "NhwcConv_3_weight_NHWC" + ], + "out_args": [ + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3" + ], + "const_args": [ + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + 
"/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" + ], + "const_args": [ + "Attention_0_qkv_weight_key" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + 
"name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" + ], + "const_args": [ + "Attention_0_qkv_weight_query" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0" + ], + "const_args": [ + "Attention_0_qkv_weight_value" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { 
+ "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_0", + "type": "SDMHA_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_0_0" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "4096" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_0_0" + ], + "const_args": [ + "onnx::MatMul_5658_11_0_0" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": 
"int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75", + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2" + ], + "const_args": [ + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": 
"float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1" + ], + "const_args": [ + "onnx::MatMul_5659" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + 
"/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0" + ], + "const_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0_bfp.wts" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_0", + "type": "SDFlatMHA", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + 
"/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1" + ], + "const_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.wts" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76" + ], + "const_args": [ + "onnx::MatMul_5669_11_0_1" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76", + 
"/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3" + ], + "const_args": [ + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + 
"1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_0_0", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2" + ], + "const_args": [ + "onnx::MatMul_5670_11_0_2_12_0_0" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_0_1", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2" + ], + "const_args": [ + "onnx::MatMul_5670_11_0_2_12_0_1" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + 
"bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0" + ], + "const_args": [ + "onnx::MatMul_5671_11_0_3" + ], + "out_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } 
+ }, + { + "name": "/down_blocks.0/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_4-/down_blocks.0/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4" + ], + "const_args": [ + "NhwcConv_4_weight_NHWC" + ], + "out_args": [ + "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + 
] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4", + "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_3", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5" + ], + "const_args": [ + "GroupNorm_3_wts_6_0_2" + ], + "out_args": [ + "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + 
"beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.0.resnets.1.time_emb_proj.weight_11_1_3" + ], + "out_args": [ + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_5-/down_blocks.0/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3" + ], + "const_args": [ + "NhwcConv_5_weight_NHWC" + ], + "out_args": [ + "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + 
"type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5", + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_4", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6" + ], + "const_args": [ + "GroupNorm_4_wts_6_0_3" + ], + "out_args": [ + "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + 
"output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_6-/down_blocks.0/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4" + ], + "const_args": [ + "NhwcConv_6_weight_NHWC" + ], + "out_args": [ + "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5", + 
"NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_5", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7" + ], + "const_args": [ + "GroupNorm_5_wts_6_2_1" + ], + "out_args": [ + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_7-/down_blocks.0/attentions.1/proj_in/Conv", + "type": 
"SDConv_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5" + ], + "const_args": [ + "NhwcConv_7_weight_NHWC" + ], + "out_args": [ + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7" + ], + "const_args": [ + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": 
"int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" + ], + "const_args": [ + "Attention_1_qkv_weight_key" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" + ], + "const_args": [ + "Attention_1_qkv_weight_query" + ], + "out_args": [ + 
"/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3" + ], + "const_args": [ + "Attention_1_qkv_weight_value" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_1", + "type": 
"SDMHA_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_0_1" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "4096" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_0_1" + ], + "const_args": [ + "onnx::MatMul_5688_11_0_4" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + 
"bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83", + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8" + ], + "const_args": [ + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + 
"value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4" + ], + "const_args": [ + "onnx::MatMul_5689" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3" + ], + "const_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3_bfp.wts" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + 
"8", + "4096", + "40" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_1", + "type": "SDFlatMHA", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3" + ], + "const_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.wts" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { 
+ "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84" + ], + "const_args": [ + "onnx::MatMul_5699_11_0_5" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + 
"0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9" + ], + "const_args": [ + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_1_0", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5" + ], + "const_args": [ + "onnx::MatMul_5700_11_0_6_12_1_0" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + 
"2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_1_1", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5" + ], + "const_args": [ + "onnx::MatMul_5700_11_0_6_12_1_1" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85" + ], + "const_args": [], + "out_args": [ + 
"/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1" + ], + "const_args": [ + "onnx::MatMul_5701_11_0_7" + ], + "out_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10" + ], + "attrs": { + "a_shape": { 
+ "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_8-/down_blocks.0/attentions.1/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10" + ], + "const_args": [ + "NhwcConv_8_weight_NHWC" + ], + "out_args": [ + "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.0/attentions.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8", + 
"/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7" + ], + "const_args": [], + "out_args": [ + "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_9-/down_blocks.0/downsamplers.0/conv/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11" + ], + "const_args": [ + "NhwcConv_9_weight_NHWC" + ], + "out_args": [ + "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "2", + "2" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": 
"GroupNorm_6", + "type": "SDGroupNorm_bfp", + "in_args": [ + "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" + ], + "const_args": [ + "GroupNorm_6_wts_6_0_4" + ], + "out_args": [ + "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.1.resnets.0.time_emb_proj.weight_11_1_4" + ], + "out_args": [ + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + 
"bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_10-/down_blocks.1/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6" + ], + "const_args": [ + "NhwcConv_10_weight_NHWC" + ], + "out_args": [ + "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11", + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + 
"0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_7", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12" + ], + "const_args": [ + "GroupNorm_7_wts_6_0_5" + ], + "out_args": [ + "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.1.resnets.1.time_emb_proj.weight_11_1_5" + ], + "out_args": [ + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": 
[ + "1280", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.2.resnets.0.time_emb_proj.weight_11_1_6" + ], + "out_args": [ + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.2.resnets.1.time_emb_proj.weight_11_1_7" + ], + "out_args": [ + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + 
"bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.3.resnets.0.time_emb_proj.weight_11_1_8" + ], + "out_args": [ + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "down_blocks.3.resnets.1.time_emb_proj.weight_11_1_9" + ], + "out_args": [ + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": 
[ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "mid_block.resnets.0.time_emb_proj.weight_11_1_10" + ], + "out_args": [ + "/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "mid_block.resnets.1.time_emb_proj.weight_11_1_11" + ], + "out_args": [ + "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.0.resnets.0.time_emb_proj.weight_11_1_12" + ], + "out_args": [ + 
"/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.0.resnets.1.time_emb_proj.weight_11_1_13" + ], + "out_args": [ + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.0.resnets.2.time_emb_proj.weight_11_1_14" + ], + "out_args": [ + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", 
+ "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5895" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5896" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + 
"value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5925" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5926" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5955" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5956" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + 
] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.1.resnets.0.time_emb_proj.weight_11_1_15" + ], + "out_args": [ + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.1.resnets.1.time_emb_proj.weight_11_1_16" + ], + "out_args": [ + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + 
"type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.1.resnets.2.time_emb_proj.weight_11_1_17" + ], + "out_args": [ + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5986" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + 
"value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_5987" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6016" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" 
+ ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6017" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6046" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, 
+ { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6047" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.2.resnets.0.time_emb_proj.weight_11_1_18" + ], + "out_args": [ + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + 
"/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.2.resnets.1.time_emb_proj.weight_11_1_19" + ], + "out_args": [ + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.2.resnets.2.time_emb_proj.weight_11_1_20" + ], + "out_args": [ + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6077" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26" + ], + 
"attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6078" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6107" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28" + ], + "attrs": { + 
"input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6108" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6137" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30" + ], + "attrs": { + "input_shape": { 
+ "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "encoder_hidden_states.out2_6_0" + ], + "const_args": [ + "onnx::MatMul_6138" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "77", + "768" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "77", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "768", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.3.resnets.0.time_emb_proj.weight_11_1_21" + ], + "out_args": [ + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19" + ], + "attrs": { + 
"input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.3.resnets.1.time_emb_proj.weight_11_1_22" + ], + "out_args": [ + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/time_emb_proj/Gemm", + "type": "SDGemm", + "in_args": [ + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1" + ], + "const_args": [ + "up_blocks.3.resnets.2.time_emb_proj.weight_11_1_23" + ], + "out_args": [ + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + 
"320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_11-/down_blocks.1/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7" + ], + "const_args": [ + "NhwcConv_11_weight_NHWC" + ], + "out_args": [ + "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_12-/down_blocks.1/resnets.0/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" + ], + "const_args": [ + "NhwcConv_12_weight_NHWC" + ], + "out_args": [ + "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + 
"NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10", + "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_8", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13" + ], + "const_args": [ + "GroupNorm_8_wts_6_2_2" + ], + 
"out_args": [ + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_13-/down_blocks.1/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8" + ], + "const_args": [ + "NhwcConv_13_weight_NHWC" + ], + "out_args": [ + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + 
}, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13" + ], + "const_args": [ + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" + ], + "const_args": [ + "Attention_2_qkv_weight_key" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + 
"1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" + ], + "const_args": [ + "Attention_2_qkv_weight_query" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + 
"/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6" + ], + "const_args": [ + "Attention_2_qkv_weight_value" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_2", + "type": "SDMHA_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_0_2" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "1024" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" 
+ ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_0_2" + ], + "const_args": [ + "onnx::MatMul_5718_11_0_8" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91", + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + 
"value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14" + ], + "const_args": [ + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7" + ], + "const_args": [ + "onnx::MatMul_5719" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", 
+ "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6" + ], + "const_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6_bfp.wts" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_2", + "type": "SDFlatMHA", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + 
"input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5" + ], + "const_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.wts" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92" + ], + "const_args": [ + "onnx::MatMul_5729_11_0_9" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] 
+ }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15" + ], + "const_args": [ + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + 
"value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_2_0", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8" + ], + "const_args": [ + "onnx::MatMul_5730_11_0_10_12_2_0" + ], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_2_1", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8" + ], + "const_args": [ + "onnx::MatMul_5730_11_0_10_12_2_1" + ], + "out_args": [ + 
"/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2" + ], + "const_args": [ + "onnx::MatMul_5731_11_0_11" + ], + "out_args": [ + 
"/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_14-/down_blocks.1/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16" + ], + "const_args": [ + "NhwcConv_14_weight_NHWC" + ], + "out_args": [ + "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14" + ], + "attrs": { + 
"auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14", + "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_9", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17" + ], + "const_args": [ + 
"GroupNorm_9_wts_6_0_6" + ], + "out_args": [ + "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_15-/down_blocks.1/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9" + ], + "const_args": [ + "NhwcConv_15_weight_NHWC" + ], + "out_args": [ + "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + 
"value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15", + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_10", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18" + ], + "const_args": [ + "GroupNorm_10_wts_6_0_7" + ], + "out_args": [ + "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", 
+ "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_16-/down_blocks.1/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10" + ], + "const_args": [ + "NhwcConv_16_weight_NHWC" + ], + "out_args": [ + "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17", + "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19" + ], + "attrs": { + "a_shape": 
{ + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_11", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19" + ], + "const_args": [ + "GroupNorm_11_wts_6_2_3" + ], + "out_args": [ + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_17-/down_blocks.1/attentions.1/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11" + ], + "const_args": [ + "NhwcConv_17_weight_NHWC" + ], + "out_args": [ + 
"/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17" + ], + "const_args": [ + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" 
+ ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" + ], + "const_args": [ + "Attention_3_qkv_weight_key" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" + ], + "const_args": [ + "Attention_3_qkv_weight_query" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", 
+ "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9" + ], + "const_args": [ + "Attention_3_qkv_weight_value" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_3", + "type": "SDMHA_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97", + 
"/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_0_3" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "1024" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_0_3" + ], + "const_args": [ + "onnx::MatMul_5748_11_0_12" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + 
"/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99", + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20" + ], + "const_args": [ + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + 
"value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10" + ], + "const_args": [ + "onnx::MatMul_5749" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9" + ], + "const_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9_bfp.wts" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + 
"type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_3", + "type": "SDFlatMHA", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7" + ], + "const_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.wts" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + 
"ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100" + ], + "const_args": [ + "onnx::MatMul_5759_11_0_13" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + 
"type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21" + ], + "const_args": [ + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_3_0", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11" + ], + "const_args": [ + "onnx::MatMul_5760_11_0_14_12_3_0" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" 
+ ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_3_1", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11" + ], + "const_args": [ + "onnx::MatMul_5760_11_0_14_12_3_1" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + 
"1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3" + ], + "const_args": [ + "onnx::MatMul_5761_11_0_15" + ], + "out_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": 
{ + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_18-/down_blocks.1/attentions.1/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22" + ], + "const_args": [ + "NhwcConv_18_weight_NHWC" + ], + "out_args": [ + "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.1/attentions.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18", + "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19" + ], + "const_args": [], + "out_args": [ + "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + 
] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_19-/down_blocks.1/downsamplers.0/conv/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23" + ], + "const_args": [ + "NhwcConv_19_weight_NHWC" + ], + "out_args": [ + "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "2", + "2" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_12", + "type": "SDGroupNorm_bfp", + "in_args": [ + "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" + ], + "const_args": [ + "GroupNorm_12_wts_6_0_8" + ], + "out_args": [ + 
"GroupNorm_12.out7_12.out6_0_8_bfp.out7_12" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_20-/down_blocks.2/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12" + ], + "const_args": [ + "NhwcConv_20_weight_NHWC" + ], + "out_args": [ + "NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "640" 
+ ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21", + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_13", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24" + ], + "const_args": [ + "GroupNorm_13_wts_6_0_9" + ], + "out_args": [ + "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + 
"beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_21-/down_blocks.2/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13" + ], + "const_args": [ + "NhwcConv_21_weight_NHWC" + ], + "out_args": [ + "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_22-/down_blocks.2/resnets.0/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" + ], + "const_args": [ + "NhwcConv_22_weight_NHWC" + ], + "out_args": [ + "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20" + ], + "attrs": { + 
"auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20", + "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_14", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25" + ], + 
"const_args": [ + "GroupNorm_14_wts_6_2_4" + ], + "out_args": [ + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_23-/down_blocks.2/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14" + ], + "const_args": [ + "NhwcConv_23_weight_NHWC" + ], + "out_args": [ + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + 
"type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23" + ], + "const_args": [ + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" + ], + "const_args": [ + "Attention_4_qkv_weight_key" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105" + 
], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" + ], + "const_args": [ + "Attention_4_qkv_weight_query" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + 
"/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12" + ], + "const_args": [ + "Attention_4_qkv_weight_value" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_4", + "type": "SDMHA_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_0_4" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "256" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + 
"bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_0_4" + ], + "const_args": [ + "onnx::MatMul_5778_11_0_16" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107", + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": 
"str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26" + ], + "const_args": [ + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13" + ], + "const_args": [ + "onnx::MatMul_5779" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + 
"value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12" + ], + "const_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12_bfp.wts" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_4", + "type": "SDFlatMHA", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + 
"0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9" + ], + "const_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.wts" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108" + ], + "const_args": [ + "onnx::MatMul_5789_11_0_17" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + 
"1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27" + ], + "const_args": [ + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + 
"stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_4_0", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14" + ], + "const_args": [ + "onnx::MatMul_5790_11_0_18_12_4_0" + ], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_4_1", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14" + ], + "const_args": [ + "onnx::MatMul_5790_11_0_18_12_4_1" + ], + "out_args": [ 
+ "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4" + ], + "const_args": [ + "onnx::MatMul_5791_11_0_19" + ], + "out_args": [ + 
"/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_24-/down_blocks.2/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28" + ], + "const_args": [ + "NhwcConv_24_weight_NHWC" + ], + "out_args": [ + "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24" + ], + "attrs": { + 
"auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24", + "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_15", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29" + ], + "const_args": [ + 
"GroupNorm_15_wts_6_0_10" + ], + "out_args": [ + "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_25-/down_blocks.2/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15" + ], + "const_args": [ + "NhwcConv_25_weight_NHWC" + ], + "out_args": [ + "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + 
"type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25", + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_16", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30" + ], + "const_args": [ + "GroupNorm_16_wts_6_0_11" + ], + "out_args": [ + "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + 
"gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_26-/down_blocks.2/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16" + ], + "const_args": [ + "NhwcConv_26_weight_NHWC" + ], + "out_args": [ + "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29", + "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26" + ], + "const_args": [], + "out_args": [ + 
"/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_17", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31" + ], + "const_args": [ + "GroupNorm_17_wts_6_2_5" + ], + "out_args": [ + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_27-/down_blocks.2/attentions.1/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17" + ], + 
"const_args": [ + "NhwcConv_27_weight_NHWC" + ], + "out_args": [ + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27" + ], + "const_args": [ + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ 
+ "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" + ], + "const_args": [ + "Attention_5_qkv_weight_key" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" + ], + "const_args": [ + "Attention_5_qkv_weight_query" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", 
+ "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15" + ], + "const_args": [ + "Attention_5_qkv_weight_value" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_5", + "type": "SDMHA_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112", + 
"/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_0_5" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "256" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_0_5" + ], + "const_args": [ + "onnx::MatMul_5808_11_0_20" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": 
"/down_blocks.2/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115", + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32" + ], + "const_args": [ + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + 
"type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16" + ], + "const_args": [ + "onnx::MatMul_5809" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15" + ], + "const_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15_bfp.wts" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + 
"160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_5", + "type": "SDFlatMHA", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11" + ], + "const_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.wts" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", 
+ "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116" + ], + "const_args": [ + "onnx::MatMul_5819_11_0_21" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + 
"bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33" + ], + "const_args": [ + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_5_0", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17" + ], + "const_args": [ + "onnx::MatMul_5820_11_0_22_12_5_0" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + 
"value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_5_1", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17" + ], + "const_args": [ + "onnx::MatMul_5820_11_0_22_12_5_1" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5" + ], + "attrs": { + "a_shape": { + 
"type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5" + ], + "const_args": [ + "onnx::MatMul_5821_11_0_23" + ], + "out_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33" + ], + "const_args": [], + "out_args": [ + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", 
+ "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_28-/down_blocks.2/attentions.1/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34" + ], + "const_args": [ + "NhwcConv_28_weight_NHWC" + ], + "out_args": [ + "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.2/attentions.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28", + "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31" + ], + "const_args": [], + "out_args": [ + 
"/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_29-/down_blocks.2/downsamplers.0/conv/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35" + ], + "const_args": [ + "NhwcConv_29_weight_NHWC" + ], + "out_args": [ + "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "2", + "2" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_18", + "type": "SDGroupNorm_bfp", + "in_args": [ + 
"NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29" + ], + "const_args": [ + "GroupNorm_18_wts_6_0_12" + ], + "out_args": [ + "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_30-/down_blocks.3/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18" + ], + "const_args": [ + "NhwcConv_30_weight_NHWC" + ], + "out_args": [ + "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + 
"output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30", + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_19", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36" + ], + "const_args": [ + "GroupNorm_19_wts_6_0_13" + ], + "out_args": [ + "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + 
"8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_31-/down_blocks.3/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19" + ], + "const_args": [ + "NhwcConv_31_weight_NHWC" + ], + "out_args": [ + "NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29", + 
"NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_20", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37" + ], + "const_args": [ + "GroupNorm_20_wts_6_0_14" + ], + "out_args": [ + "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": 
"NhwcConv_32-/down_blocks.3/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20" + ], + "const_args": [ + "NhwcConv_32_weight_NHWC" + ], + "out_args": [ + "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32", + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + 
"type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_21", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38" + ], + "const_args": [ + "GroupNorm_21_wts_6_0_15" + ], + "out_args": [ + "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_33-/down_blocks.3/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21" + ], + "const_args": [ + "NhwcConv_33_weight_NHWC" + ], + "out_args": [ + "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + 
}, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/down_blocks.3/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37", + "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33" + ], + "const_args": [], + "out_args": [ + "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_22", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39" + ], + "const_args": [ + "GroupNorm_22_wts_6_0_16" + ], + "out_args": [ + "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": 
[ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_34-/mid_block/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22" + ], + "const_args": [ + "NhwcConv_34_weight_NHWC" + ], + "out_args": [ + "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": 
[ + "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34", + "/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_23", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40" + ], + "const_args": [ + "GroupNorm_23_wts_6_0_17" + ], + "out_args": [ + "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, 
+ { + "name": "NhwcConv_35-/mid_block/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23" + ], + "const_args": [ + "NhwcConv_35_weight_NHWC" + ], + "out_args": [ + "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39", + "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + 
"type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_24", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41" + ], + "const_args": [ + "GroupNorm_24_wts_6_2_6" + ], + "out_args": [ + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_36-/mid_block/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24" + ], + "const_args": [ + "NhwcConv_36_weight_NHWC" + ], + "out_args": [ + "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + 
"value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36" + ], + "const_args": [ + "mid_block.attentions.0.transformer_blocks.0.norm1.weight", + "mid_block.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + 
"/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" + ], + "const_args": [ + "Attention_6_qkv_weight_key" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" + ], + "const_args": [ + "Attention_6_qkv_weight_query" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18" + ], + "const_args": [ + "Attention_6_qkv_weight_value" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121_bfp.wts" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + 
"64", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120_bfp.wts" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122_bfp.wts" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "in_dtypes": 
{ + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_6", + "type": "SDFlatMHA", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "160", + "64" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.wts" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + 
"bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123" + ], + "const_args": [ + "onnx::MatMul_5846_11_0_24" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123", + "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42" + ], + "const_args": [ + "mid_block.attentions.0.transformer_blocks.0.norm2.weight", + "mid_block.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19" + ], + "const_args": [ + "onnx::MatMul_5847" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + 
"type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18_bfp.wts" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "64", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_6", + "type": "SDFlatMHA", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "160", + 
"77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13" + ], + "const_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.wts" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124" + ], + "const_args": [ + "onnx::MatMul_5857_11_0_25" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": 
"str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124", + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43" + ], + "const_args": [ + "mid_block.attentions.0.transformer_blocks.0.norm3.weight", + "mid_block.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_6_0", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20" + ], + "const_args": [ + "onnx::MatMul_5858_11_0_26_12_6_0" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_6_1", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20" + ], + "const_args": [ + "onnx::MatMul_5858_11_0_26_12_6_1" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + 
] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6" + ], + "const_args": [ + "onnx::MatMul_5859_11_0_27" + ], + "out_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "5120" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "weight_shape": { + 
"type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127", + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_37-/mid_block/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44" + ], + "const_args": [ + "NhwcConv_37_weight_NHWC" + ], + "out_args": [ + "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + 
] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37", + "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41" + ], + "const_args": [], + "out_args": [ + "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_25", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45" + ], + "const_args": [ + "GroupNorm_25_wts_6_0_18" + ], + "out_args": [ + "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + 
"0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_38-/mid_block/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25" + ], + "const_args": [ + "NhwcConv_38_weight_NHWC" + ], + "out_args": [ + "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + 
"NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38", + "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_26", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46" + ], + "const_args": [ + "GroupNorm_26_wts_6_0_19" + ], + "out_args": [ + "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { 
+ "name": "NhwcConv_39-/mid_block/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26" + ], + "const_args": [ + "NhwcConv_39_weight_NHWC" + ], + "out_args": [ + "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/mid_block/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45", + "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39" + ], + "const_args": [], + "out_args": [ + "/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + 
"type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/Concat", + "type": "SDConcat_bfp", + "in_args": [ + "/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47", + "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/Concat.out19_1_bfp.out20_0" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_27", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.0/Concat.out19_1_bfp.out20_0" + ], + "const_args": [ + "GroupNorm_27_wts_6_0_20" + ], + "out_args": [ + "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" 
+ ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_40-/up_blocks.0/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27" + ], + "const_args": [ + "NhwcConv_40_weight_NHWC" + ], + "out_args": [ + "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41", + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + 
"is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_28", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48" + ], + "const_args": [ + "GroupNorm_28_wts_6_0_21" + ], + "out_args": [ + "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_41-/up_blocks.0/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28" + ], + "const_args": [ + "NhwcConv_41_weight_NHWC" + ], + "out_args": [ + "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + 
"1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_42-/up_blocks.0/resnets.0/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.0/Concat.out19_1_bfp.out20_0" + ], + "const_args": [ + "NhwcConv_42_weight_NHWC" + ], + "out_args": [ + "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + 
"name": "/up_blocks.0/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40", + "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/Concat_1", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49", + "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/Concat_1.out19_2_bfp.out20_1" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_29", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.0/Concat_1.out19_2_bfp.out20_1" + ], + "const_args": [ + "GroupNorm_29_wts_6_0_22" + ], + "out_args": [ + "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29" + 
], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_43-/up_blocks.0/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29" + ], + "const_args": [ + "NhwcConv_43_weight_NHWC" + ], + "out_args": [ + "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + 
"value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44", + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_30", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50" + ], + "const_args": [ + "GroupNorm_30_wts_6_0_23" + ], + "out_args": [ + "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, 
+ "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_44-/up_blocks.0/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30" + ], + "const_args": [ + "NhwcConv_44_weight_NHWC" + ], + "out_args": [ + "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_45-/up_blocks.0/resnets.1/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.0/Concat_1.out19_2_bfp.out20_1" + ], + "const_args": [ + "NhwcConv_45_weight_NHWC" + ], + "out_args": [ + "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" 
+ ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43", + "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/Concat_2", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51", + "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29" + ], + "const_args": [], + "out_args": [ + 
"/up_blocks.0/Concat_2.out19_3_bfp.out20_2" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_31", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.0/Concat_2.out19_3_bfp.out20_2" + ], + "const_args": [ + "GroupNorm_31_wts_6_0_24" + ], + "out_args": [ + "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_46-/up_blocks.0/resnets.2/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31" + ], + "const_args": [ + "NhwcConv_46_weight_NHWC" + ], 
+ "out_args": [ + "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47", + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_32", + "type": "SDGroupNorm_bfp", + "in_args": [ + 
"/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52" + ], + "const_args": [ + "GroupNorm_32_wts_6_0_25" + ], + "out_args": [ + "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_47-/up_blocks.0/resnets.2/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32" + ], + "const_args": [ + "NhwcConv_47_weight_NHWC" + ], + "out_args": [ + "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": 
[ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_48-/up_blocks.0/resnets.2/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.0/Concat_2.out19_3_bfp.out20_2" + ], + "const_args": [ + "NhwcConv_48_weight_NHWC" + ], + "out_args": [ + "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/resnets.2/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46", + "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48" + ], + "const_args": [], + "out_args": [ + "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53" + ], + 
"attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.0/upsamplers.0/Resize", + "type": "SDResize_bfp", + "in_args": [ + "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53" + ], + "const_args": [ + "/up_blocks.0/upsamplers.0/Resize.weights3_0" + ], + "out_args": [ + "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "8", + "8", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_49-/up_blocks.0/upsamplers.0/conv/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0" + ], + "const_args": [ + "NhwcConv_49_weight_NHWC" + ], + "out_args": [ + "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + 
"type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/Concat", + "type": "SDConcat_bfp", + "in_args": [ + "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49", + "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/Concat.out19_4_bfp.out20_3" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_33", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/Concat.out19_4_bfp.out20_3" + ], + "const_args": [ + "GroupNorm_33_wts_6_0_26" + ], + "out_args": [ + "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + 
"value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_50-/up_blocks.1/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33" + ], + "const_args": [ + "NhwcConv_50_weight_NHWC" + ], + "out_args": [ + "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + 
"NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51", + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_34", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54" + ], + "const_args": [ + "GroupNorm_34_wts_6_0_27" + ], + "out_args": [ + "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] 
+ } + } + }, + { + "name": "NhwcConv_51-/up_blocks.1/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34" + ], + "const_args": [ + "NhwcConv_51_weight_NHWC" + ], + "out_args": [ + "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_52-/up_blocks.1/resnets.0/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/Concat.out19_4_bfp.out20_3" + ], + "const_args": [ + "NhwcConv_52_weight_NHWC" + ], + "out_args": [ + "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + 
] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50", + "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_35", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55" + ], + "const_args": [ + "GroupNorm_35_wts_6_2_7" + ], + "out_args": [ + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ 
+ "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_53-/up_blocks.1/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35" + ], + "const_args": [ + "NhwcConv_53_weight_NHWC" + ], + "out_args": [ + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", 
+ "in_args": [ + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53" + ], + "const_args": [ + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" + ], + "const_args": [ + "Attention_7_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] 
+ }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" + ], + "const_args": [ + "Attention_7_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21" + ], + "const_args": [ + "Attention_7_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + 
"2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_7", + "type": "SDMHA_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_0_6" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "256" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_0_6" + ], + "const_args": [ + "onnx::MatMul_5893_11_0_28" + ], + 
"out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131", + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56" + ], + "const_args": [ + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + 
"up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22" + ], + "const_args": [ + "onnx::MatMul_5894" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ 
+ "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21" + ], + "const_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21_bfp.wts" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_7", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + 
}, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15" + ], + "const_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.wts" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132" + ], + "const_args": [ + "onnx::MatMul_5904_11_0_29" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + 
"/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57" + ], + "const_args": [ + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + 
"type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_7_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23" + ], + "const_args": [ + "onnx::MatMul_5905_11_0_30_12_7_0" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_7_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23" + ], + "const_args": [ + "onnx::MatMul_5905_11_0_30_12_7_1" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7" + ], + "const_args": [ + "onnx::MatMul_5906_11_0_31" + ], + "out_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", 
+ "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_54-/up_blocks.1/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58" + ], + "const_args": [ + "NhwcConv_54_weight_NHWC" + ], + "out_args": [ + "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] 
+ }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54", + "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/Concat_1", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59", + "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/Concat_1.out19_5_bfp.out20_4" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_36", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/Concat_1.out19_5_bfp.out20_4" + ], + "const_args": [ + "GroupNorm_36_wts_6_0_28" + ], + "out_args": [ + "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "5120" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_55-/up_blocks.1/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36" + ], + "const_args": [ + "NhwcConv_55_weight_NHWC" + ], + "out_args": [ + "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + 
"value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56", + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_37", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60" + ], + "const_args": [ + "GroupNorm_37_wts_6_0_29" + ], + "out_args": [ + "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": 
"int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_56-/up_blocks.1/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37" + ], + "const_args": [ + "NhwcConv_56_weight_NHWC" + ], + "out_args": [ + "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_57-/up_blocks.1/resnets.1/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + 
"/up_blocks.1/Concat_1.out19_5_bfp.out20_4" + ], + "const_args": [ + "NhwcConv_57_weight_NHWC" + ], + "out_args": [ + "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "2560" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55", + "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + 
] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_38", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61" + ], + "const_args": [ + "GroupNorm_38_wts_6_2_8" + ], + "out_args": [ + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_58-/up_blocks.1/attentions.1/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38" + ], + "const_args": [ + "NhwcConv_58_weight_NHWC" + ], + "out_args": [ + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, 
+ "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58" + ], + "const_args": [ + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" + ], + 
"const_args": [ + "Attention_8_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" + ], + "const_args": [ + "Attention_8_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": 
[ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24" + ], + "const_args": [ + "Attention_8_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_8", + "type": "SDMHA_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_0_7" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "256" + ] + }, + "op_version": { + "type": 
"str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_0_7" + ], + "const_args": [ + "onnx::MatMul_5923_11_0_32" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139", + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + 
"type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62" + ], + "const_args": [ + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25" + ], + "const_args": [ + "onnx::MatMul_5924" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + 
"1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24" + ], + "const_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24_bfp.wts" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_8", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17" + ], + 
"attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17" + ], + "const_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.wts" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140" + ], + "const_args": [ + "onnx::MatMul_5934_11_0_33" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63" + ], + "const_args": [ + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + 
}, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_8_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26" + ], + "const_args": [ + "onnx::MatMul_5935_11_0_34_12_8_0" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_8_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26" + ], 
+ "const_args": [ + "onnx::MatMul_5935_11_0_34_12_8_1" + ], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8" + ], + "const_args": [ + "onnx::MatMul_5936_11_0_35" + ], + "out_args": [ + 
"/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_59-/up_blocks.1/attentions.1/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64" + ], + "const_args": [ + "NhwcConv_59_weight_NHWC" + ], + "out_args": [ + "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59" + ], + "attrs": { + "auto_pad": { + 
"type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59", + "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/Concat_2", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65", + 
"NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/Concat_2.out19_6_bfp.out20_5" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_39", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/Concat_2.out19_6_bfp.out20_5" + ], + "const_args": [ + "GroupNorm_39_wts_6_0_30" + ], + "out_args": [ + "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "3840" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_60-/up_blocks.1/resnets.2/conv1/Conv", + 
"type": "SDConv_bfp", + "in_args": [ + "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39" + ], + "const_args": [ + "NhwcConv_60_weight_NHWC" + ], + "out_args": [ + "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61", + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + 
"ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_40", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66" + ], + "const_args": [ + "GroupNorm_40_wts_6_0_31" + ], + "out_args": [ + "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_61-/up_blocks.1/resnets.2/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40" + ], + "const_args": [ + "NhwcConv_61_weight_NHWC" + ], + "out_args": [ + "NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + 
"1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_62-/up_blocks.1/resnets.2/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/Concat_2.out19_6_bfp.out20_5" + ], + "const_args": [ + "NhwcConv_62_weight_NHWC" + ], + "out_args": [ + "NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/resnets.2/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60", + 
"NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_41", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67" + ], + "const_args": [ + "GroupNorm_41_wts_6_2_9" + ], + "out_args": [ + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_63-/up_blocks.1/attentions.2/proj_in/Conv", + "type": 
"SDConv_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41" + ], + "const_args": [ + "NhwcConv_63_weight_NHWC" + ], + "out_args": [ + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63" + ], + "const_args": [ + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": 
"int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" + ], + "const_args": [ + "Attention_9_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" + ], + "const_args": [ + "Attention_9_qkv_weight_query" + ], + "out_args": [ + 
"/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27" + ], + "const_args": [ + "Attention_9_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_9", + "type": 
"SDMHA_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_0_8" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "256" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_0_8" + ], + "const_args": [ + "onnx::MatMul_5953_11_0_36" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + 
"bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147", + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68" + ], + "const_args": [ + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + 
"1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28" + ], + "const_args": [ + "onnx::MatMul_5954" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27" + ], + "const_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27_bfp.wts" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + 
"160" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "256", + "160" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_9", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "160", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19" + ], + "const_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.wts" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + 
"value": [ + "2", + "256", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148" + ], + "const_args": [ + "onnx::MatMul_5964_11_0_37" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + 
"in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69" + ], + "const_args": [ + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_9_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29" + ], + "const_args": [ + "onnx::MatMul_5965_11_0_38_12_9_0" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + 
] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_9_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29" + ], + "const_args": [ + "onnx::MatMul_5965_11_0_38_12_9_1" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "5120" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9" + ], + 
"attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9" + ], + "const_args": [ + "onnx::MatMul_5966_11_0_39" + ], + "out_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "256", + "5120" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "5120", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69" + ], + "const_args": [], + "out_args": [ + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + 
"2", + "256", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "256", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_64-/up_blocks.1/attentions.2/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70" + ], + "const_args": [ + "NhwcConv_64_weight_NHWC" + ], + "out_args": [ + "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/attentions.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64", + "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67" + ], + "const_args": [], + "out_args": [ + 
"/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.1/upsamplers.0/Resize", + "type": "SDResize_bfp", + "in_args": [ + "/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71" + ], + "const_args": [ + "/up_blocks.1/upsamplers.0/Resize.weights3_1" + ], + "out_args": [ + "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "16", + "16", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_65-/up_blocks.1/upsamplers.0/conv/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1" + ], + "const_args": [ + "NhwcConv_65_weight_NHWC" + ], + "out_args": [ + "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": 
"int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/Concat", + "type": "SDConcat_bfp", + "in_args": [ + "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65", + "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/Concat.out19_7_bfp.out20_6" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_42", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/Concat.out19_7_bfp.out20_6" + ], + "const_args": [ + "GroupNorm_42_wts_6_0_32" + ], + "out_args": [ + "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": 
"int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "3840" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_66-/up_blocks.2/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42" + ], + "const_args": [ + "NhwcConv_66_weight_NHWC" + ], + "out_args": [ + "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/Add", + 
"type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67", + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_43", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72" + ], + "const_args": [ + "GroupNorm_43_wts_6_0_33" + ], + "out_args": [ + "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + 
"type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_67-/up_blocks.2/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43" + ], + "const_args": [ + "NhwcConv_67_weight_NHWC" + ], + "out_args": [ + "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_68-/up_blocks.2/resnets.0/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/Concat.out19_7_bfp.out20_6" + ], + "const_args": [ + "NhwcConv_68_weight_NHWC" + ], + "out_args": [ + "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": 
"int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1920" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "1920" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66", + "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_44", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73" + ], + "const_args": [ + "GroupNorm_44_wts_6_2_10" + ], + "out_args": [ + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": 
{ + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_69-/up_blocks.2/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44" + ], + "const_args": [ + "NhwcConv_69_weight_NHWC" + ], + "out_args": [ + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + 
"type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69" + ], + "const_args": [ + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" + ], + "const_args": [ + "Attention_10_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": 
"int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" + ], + "const_args": [ + "Attention_10_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30" + ], + "const_args": [ + "Attention_10_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_10", + "type": "SDMHA_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_0_9" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "1024" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_0_9" + ], + "const_args": [ + 
"onnx::MatMul_5984_11_0_40" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155", + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74" + ], + "const_args": [ + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + 
"up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31" + ], + "const_args": [ + "onnx::MatMul_5985" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + 
"1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30" + ], + "const_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30_bfp.wts" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_10", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + 
}, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21" + ], + "const_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.wts" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156" + ], + "const_args": [ + "onnx::MatMul_5995_11_0_41" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75" + ], + "const_args": [ + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": 
"str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_10_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32" + ], + "const_args": [ + "onnx::MatMul_5996_11_0_42_12_10_0" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_10_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32" + ], + "const_args": [ + "onnx::MatMul_5996_11_0_42_12_10_1" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10" + ], + "const_args": [ + "onnx::MatMul_5997_11_0_43" + ], + "out_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + 
"bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_70-/up_blocks.2/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76" + ], + "const_args": [ + "NhwcConv_70_weight_NHWC" + ], + "out_args": [ + "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", 
+ "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70", + "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/Concat_1", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77", + "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/Concat_1.out19_8_bfp.out20_7" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_45", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/Concat_1.out19_8_bfp.out20_7" + ], + "const_args": [ + "GroupNorm_45_wts_6_0_34" + ], + "out_args": [ + "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "2560" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_71-/up_blocks.2/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45" + ], + "const_args": [ + "NhwcConv_71_weight_NHWC" + ], + "out_args": [ + "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + 
"value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72", + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_46", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78" + ], + "const_args": [ + "GroupNorm_46_wts_6_0_35" + ], + "out_args": [ + "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": 
"int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_72-/up_blocks.2/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46" + ], + "const_args": [ + "NhwcConv_72_weight_NHWC" + ], + "out_args": [ + "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_73-/up_blocks.2/resnets.1/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + 
"/up_blocks.2/Concat_1.out19_8_bfp.out20_7" + ], + "const_args": [ + "NhwcConv_73_weight_NHWC" + ], + "out_args": [ + "NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "1280" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71", + "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + 
}, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_47", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79" + ], + "const_args": [ + "GroupNorm_47_wts_6_2_11" + ], + "out_args": [ + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_74-/up_blocks.2/attentions.1/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47" + ], + "const_args": [ + "NhwcConv_74_weight_NHWC" + ], + "out_args": [ + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + 
"input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74" + ], + "const_args": [ + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" + ], + 
"const_args": [ + "Attention_11_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" + ], + "const_args": [ + "Attention_11_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ 
+ "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33" + ], + "const_args": [ + "Attention_11_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_11", + "type": "SDMHA_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_0_10" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "1024" + ] + }, + "op_version": { + "type": 
"str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_0_10" + ], + "const_args": [ + "onnx::MatMul_6014_11_0_44" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163", + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + 
"type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80" + ], + "const_args": [ + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34" + ], + "const_args": [ + "onnx::MatMul_6015" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + 
"640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33" + ], + "const_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33_bfp.wts" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_11", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23" + ], + 
"attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23" + ], + "const_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.wts" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164" + ], + "const_args": [ + "onnx::MatMul_6025_11_0_45" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81" + ], + "const_args": [ + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, 
+ "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_11_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35" + ], + "const_args": [ + "onnx::MatMul_6026_11_0_46_12_11_0" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_11_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35" + ], 
+ "const_args": [ + "onnx::MatMul_6026_11_0_46_12_11_1" + ], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11" + ], + "const_args": [ + "onnx::MatMul_6027_11_0_47" + ], + "out_args": [ + 
"/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_75-/up_blocks.2/attentions.1/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82" + ], + "const_args": [ + "NhwcConv_75_weight_NHWC" + ], + "out_args": [ + "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75" + ], + "attrs": { + "auto_pad": { 
+ "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75", + "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/Concat_2", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83", + 
"NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/Concat_2.out19_9_bfp.out20_8" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_48", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/Concat_2.out19_9_bfp.out20_8" + ], + "const_args": [ + "GroupNorm_48_wts_6_0_36" + ], + "out_args": [ + "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "960" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "960" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_76-/up_blocks.2/resnets.2/conv1/Conv", + "type": 
"SDConv_bfp", + "in_args": [ + "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48" + ], + "const_args": [ + "NhwcConv_76_weight_NHWC" + ], + "out_args": [ + "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77", + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": 
{ + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_49", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84" + ], + "const_args": [ + "GroupNorm_49_wts_6_0_37" + ], + "out_args": [ + "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_77-/up_blocks.2/resnets.2/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49" + ], + "const_args": [ + "NhwcConv_77_weight_NHWC" + ], + "out_args": [ + "NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + 
"input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_78-/up_blocks.2/resnets.2/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/Concat_2.out19_9_bfp.out20_8" + ], + "const_args": [ + "NhwcConv_78_weight_NHWC" + ], + "out_args": [ + "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/resnets.2/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76", + 
"NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_50", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85" + ], + "const_args": [ + "GroupNorm_50_wts_6_2_12" + ], + "out_args": [ + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_79-/up_blocks.2/attentions.2/proj_in/Conv", + "type": 
"SDConv_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50" + ], + "const_args": [ + "NhwcConv_79_weight_NHWC" + ], + "out_args": [ + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79" + ], + "const_args": [ + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", 
+ "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" + ], + "const_args": [ + "Attention_12_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" + ], + "const_args": [ + "Attention_12_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168" + 
], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36" + ], + "const_args": [ + "Attention_12_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_12", + "type": "SDMHA_bfp", + "in_args": [ + 
"/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_0_11" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "1024" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_0_11" + ], + "const_args": [ + "onnx::MatMul_6044_11_0_48" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + 
}, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171", + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86" + ], + "const_args": [ + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { 
+ "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37" + ], + "const_args": [ + "onnx::MatMul_6045" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36" + ], + "const_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36_bfp.wts" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "8", + "1024", + "80" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_12", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "80", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25" + ], + "const_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.wts" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + 
}, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172" + ], + "const_args": [ + "onnx::MatMul_6055_11_0_49" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87" + ], + "const_args": [ + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_12_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38" + ], + "const_args": [ + "onnx::MatMul_6056_11_0_50_12_12_0" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + 
"value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_12_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38" + ], + "const_args": [ + "onnx::MatMul_6056_11_0_50_12_12_1" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "2560" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12" + ], + "attrs": { + "a_shape": { + "type": "int", 
+ "value": [ + "2", + "1024", + "2560" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12" + ], + "const_args": [ + "onnx::MatMul_6057_11_0_51" + ], + "out_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "1024", + "2560" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "2560", + "640" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + 
"c_shape": { + "type": "int", + "value": [ + "2", + "1024", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_80-/up_blocks.2/attentions.2/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88" + ], + "const_args": [ + "NhwcConv_80_weight_NHWC" + ], + "out_args": [ + "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/attentions.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80", + "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85" + ], + "const_args": [], + "out_args": [ + "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89" + ], + 
"attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.2/upsamplers.0/Resize", + "type": "SDResize_bfp", + "in_args": [ + "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89" + ], + "const_args": [ + "/up_blocks.2/upsamplers.0/Resize.weights3_2" + ], + "out_args": [ + "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "32", + "32", + "640" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_81-/up_blocks.2/upsamplers.0/conv/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2" + ], + "const_args": [ + "NhwcConv_81_weight_NHWC" + ], + "out_args": [ + "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { 
+ "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "640", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/Concat", + "type": "SDConcat_bfp", + "in_args": [ + "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81", + "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/Concat.out19_10_bfp.out20_9" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_51", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/Concat.out19_10_bfp.out20_9" + ], + "const_args": [ + "GroupNorm_51_wts_6_0_38" + ], + "out_args": [ + "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + 
"value": [ + "2", + "64", + "64", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1920" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "960" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "960" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_82-/up_blocks.3/resnets.0/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51" + ], + "const_args": [ + "NhwcConv_82_weight_NHWC" + ], + "out_args": [ + "NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + 
"NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83", + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_52", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90" + ], + "const_args": [ + "GroupNorm_52_wts_6_0_39" + ], + "out_args": [ + "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } 
+ }, + { + "name": "NhwcConv_83-/up_blocks.3/resnets.0/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52" + ], + "const_args": [ + "NhwcConv_83_weight_NHWC" + ], + "out_args": [ + "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_84-/up_blocks.3/resnets.0/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/Concat.out19_10_bfp.out20_9" + ], + "const_args": [ + "NhwcConv_84_weight_NHWC" + ], + "out_args": [ + "NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + 
"input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "960" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "960" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82", + "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_53", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91" + ], + "const_args": [ + "GroupNorm_53_wts_6_2_13" + ], + "out_args": [ + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + 
}, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_85-/up_blocks.3/attentions.0/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53" + ], + "const_args": [ + "NhwcConv_85_weight_NHWC" + ], + "out_args": [ + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + 
"/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85" + ], + "const_args": [ + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" + ], + "const_args": [ + "Attention_13_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + 
"out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" + ], + "const_args": [ + "Attention_13_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39" + ], + "const_args": [ + "Attention_13_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + 
"4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_13", + "type": "SDMHA_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_0_12" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "4096" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_0_12" + ], + "const_args": [ + "onnx::MatMul_6075_11_0_52" + ], + 
"out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179", + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92" + ], + "const_args": [ + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight", + 
"up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40" + ], + "const_args": [ + "onnx::MatMul_6076" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + 
"1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39" + ], + "const_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39_bfp.wts" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_13", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + 
}, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27" + ], + "const_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.wts" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180" + ], + "const_args": [ + "onnx::MatMul_6086_11_0_53" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + 
"/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93" + ], + "const_args": [ + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": 
"str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_13_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41" + ], + "const_args": [ + "onnx::MatMul_6087_11_0_54_12_13_0" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_13_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41" + ], + "const_args": [ + "onnx::MatMul_6087_11_0_54_12_13_1" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13" + ], + "const_args": [ + "onnx::MatMul_6088_11_0_55" + ], + "out_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + 
"bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_86-/up_blocks.3/attentions.0/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94" + ], + "const_args": [ + "NhwcConv_86_weight_NHWC" + ], + "out_args": [ + "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", 
+ "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86", + "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/Concat_1", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95", + "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/Concat_1.out19_11_bfp.out20_10" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_54", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/Concat_1.out19_11_bfp.out20_10" + ], + "const_args": [ + "GroupNorm_54_wts_6_0_40" + ], + "out_args": [ + "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_87-/up_blocks.3/resnets.1/conv1/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54" + ], + "const_args": [ + "NhwcConv_87_weight_NHWC" + ], + "out_args": [ + "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": 
[ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88", + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_55", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96" + ], + "const_args": [ + "GroupNorm_55_wts_6_0_41" + ], + "out_args": [ + "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + 
"value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_88-/up_blocks.3/resnets.1/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55" + ], + "const_args": [ + "NhwcConv_88_weight_NHWC" + ], + "out_args": [ + "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_89-/up_blocks.3/resnets.1/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + 
"/up_blocks.3/Concat_1.out19_11_bfp.out20_10" + ], + "const_args": [ + "NhwcConv_89_weight_NHWC" + ], + "out_args": [ + "NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.1/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87", + "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + 
}, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_56", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97" + ], + "const_args": [ + "GroupNorm_56_wts_6_2_14" + ], + "out_args": [ + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_90-/up_blocks.3/attentions.1/proj_in/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56" + ], + "const_args": [ + "NhwcConv_90_weight_NHWC" + ], + "out_args": [ + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + 
"input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90" + ], + "const_args": [ + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" + ], + 
"const_args": [ + "Attention_14_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" + ], + "const_args": [ + "Attention_14_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ 
+ "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42" + ], + "const_args": [ + "Attention_14_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_14", + "type": "SDMHA_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_0_13" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "4096" + ] + }, + "op_version": { + "type": 
"str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_0_13" + ], + "const_args": [ + "onnx::MatMul_6105_11_0_56" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187", + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + 
"type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98" + ], + "const_args": [ + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43" + ], + "const_args": [ + "onnx::MatMul_6106" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + 
"320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42" + ], + "const_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42_bfp.wts" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_14", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29" + ], + 
"attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29" + ], + "const_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.wts" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188" + ], + "const_args": [ + "onnx::MatMul_6116_11_0_57" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99" + ], + "const_args": [ + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, 
+ "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_14_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44" + ], + "const_args": [ + "onnx::MatMul_6117_11_0_58_12_14_0" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_14_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44" + ], 
+ "const_args": [ + "onnx::MatMul_6117_11_0_58_12_14_1" + ], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14" + ], + "const_args": [ + "onnx::MatMul_6118_11_0_59" + ], + "out_args": [ + 
"/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_91-/up_blocks.3/attentions.1/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100" + ], + "const_args": [ + "NhwcConv_91_weight_NHWC" + ], + "out_args": [ + "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91" + ], + "attrs": { + "auto_pad": 
{ + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.1/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91", + "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/Concat_2", + "type": "SDConcat_bfp", + "in_args": [ + "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101", + 
"NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/Concat_2.out19_12_bfp.out20_11" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "3" + ] + }, + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_57", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/Concat_2.out19_12_bfp.out20_11" + ], + "const_args": [ + "GroupNorm_57_wts_6_0_42" + ], + "out_args": [ + "GroupNorm_57.out7_57.out6_0_42_bfp.out7_57" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1280" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_92-/up_blocks.3/resnets.2/conv1/Conv", + "type": "SDConv_bfp", + 
"in_args": [ + "GroupNorm_57.out7_57.out6_0_42_bfp.out7_57" + ], + "const_args": [ + "NhwcConv_92_weight_NHWC" + ], + "out_args": [ + "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93", + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "1", + "1", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": 
"int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_58", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102" + ], + "const_args": [ + "GroupNorm_58_wts_6_0_43" + ], + "out_args": [ + "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_93-/up_blocks.3/resnets.2/conv2/Conv", + "type": "SDConv_bfp", + "in_args": [ + "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58" + ], + "const_args": [ + "NhwcConv_93_weight_NHWC" + ], + "out_args": [ + "NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": 
{ + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_94-/up_blocks.3/resnets.2/conv_shortcut/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/Concat_2.out19_12_bfp.out20_11" + ], + "const_args": [ + "NhwcConv_94_weight_NHWC" + ], + "out_args": [ + "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "640" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "640" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/resnets.2/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92", + 
"NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_59", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103" + ], + "const_args": [ + "GroupNorm_59_wts_6_2_15" + ], + "out_args": [ + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_95-/up_blocks.3/attentions.2/proj_in/Conv", + "type": 
"SDConv_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59" + ], + "const_args": [ + "NhwcConv_95_weight_NHWC" + ], + "out_args": [ + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95" + ], + "const_args": [ + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", 
+ "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_key", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" + ], + "const_args": [ + "Attention_15_qkv_weight_key" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_query", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" + ], + "const_args": [ + "Attention_15_qkv_weight_query" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192" + 
], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_MatMul_value", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45" + ], + "const_args": [ + "Attention_15_qkv_weight_value" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "3" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Attention_15", + "type": "SDMHA_bfp", + "in_args": [ + 
"/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_0_14" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "4096" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v2" + ] + }, + "is_flash_mha": { + "type": "int", + "value": [ + "1" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_0_14" + ], + "const_args": [ + "onnx::MatMul_6135_11_0_60" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + 
}, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195", + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104" + ], + "const_args": [ + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": 
{ + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46" + ], + "const_args": [ + "onnx::MatMul_6136" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "head_num": { + "type": "int", + "value": [ + "8" + ] + }, + "trans_head": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45" + ], + "const_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45_bfp.wts" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "output_shape": { + 
"type": "int", + "value": [ + "2", + "8", + "4096", + "40" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "MultiHeadAttention_15", + "type": "SDFlatMHA", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "8" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "40", + "77" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "op_version": { + "type": "str", + "value": [ + "v1.1" + ] + }, + "is_flat_mha_1_1": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_SDCastBf2Bfp", + "type": "SDCastBf2Bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31" + ], + "const_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.wts" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + 
}, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196" + ], + "const_args": [ + "onnx::MatMul_6146_11_0_61" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + 
"bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization", + "type": "SDLayerNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105" + ], + "const_args": [ + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47" + ], + "attrs": { + "axis": { + "type": "int", + "value": [ + "-1" + ] + }, + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "stash_type": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_15_0", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47" + ], + "const_args": [ + "onnx::MatMul_6147_11_0_62_12_15_0" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", 
+ "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Gelu" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/proj/MatMul/MatMulAddFusion_12_15_1", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47" + ], + "const_args": [ + "onnx::MatMul_6147_11_0_62_12_15_1" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1280" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4", + "type": "SDMul_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15" + ], + "attrs": { + "a_shape": { + "type": 
"int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/MatMul/MatMulAddFusion", + "type": "SDGemm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15" + ], + "const_args": [ + "onnx::MatMul_6148_11_0_63" + ], + "out_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "4096", + "1280" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "1280", + "320" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/transformer_blocks.0/Add_2", + "type": "SDAdd_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + 
}, + "c_shape": { + "type": "int", + "value": [ + "2", + "4096", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_96-/up_blocks.3/attentions.2/proj_out/Conv", + "type": "SDConv_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106" + ], + "const_args": [ + "NhwcConv_96_weight_NHWC" + ], + "out_args": [ + "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "320", + "1", + "1", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/up_blocks.3/attentions.2/Add", + "type": "SDAdd_bfp", + "in_args": [ + "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96", + "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103" + ], + "const_args": [], + "out_args": [ + "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107" + ], + 
"attrs": { + "a_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_60", + "type": "SDGroupNorm_bfp", + "in_args": [ + "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107" + ], + "const_args": [ + "GroupNorm_60_wts_6_0_44" + ], + "out_args": [ + "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999747378752e-06" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "640" + ] + }, + "gamma_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "beta_shape": { + "type": "int", + "value": [ + "320" + ] + }, + "nonlinear": { + "type": "str", + "value": [ + "Silu" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_SDCastBfp2Bf", + "type": "SDCastBfp2Bf", + "in_args": [ + "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60" + ], + "const_args": [ + 
"GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_bfp.wts" + ], + "out_args": [ + "GroupNorm_60.out7_60.out6_0_44" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfp16ebs8" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_97-/conv_out/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_60.out7_60.out6_0_44" + ], + "const_args": [ + "NhwcConv_97_weight_NHWC" + ], + "out_args": [ + "NhwcConv_97_out-out_sample.out0_1_81" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "320" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "2", + "64", + "64", + "4" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "4", + "3", + "3", + "320" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + } + ], + "fused_tensors": { + "in": { + "buffer_size": 7636224, + "xrt_arg_id": 0, + "packed_tensors": [ + "Transpose_44_out-sample.out0_1_0", + "encoder_hidden_states.out2_6_0", + "/time_proj/Concat_1_output_0.out2_3_0" + ] + }, + "out": { + "buffer_size": 65536, + "xrt_arg_id": 1, + "packed_tensors": [ + 
"NhwcConv_97_out-out_sample.out0_1_81" + ] + }, + "scratch": { + "buffer_size": 1059969280, + "xrt_arg_id": 2, + "packed_tensors": [ + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0", + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0", + "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13", + "/time_embedding/linear_1/Gemm_output_0.out2_3_0", + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0", + "/time_embedding/linear_2/Gemm_output_0.out2_3_1", + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1", + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0", + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1", + "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0", 
+ "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1", + "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2", + "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1", + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2", + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_0_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76", + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3", + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77", + 
"/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0", + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79", + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4", + "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4", + "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5", + "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3", + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1", + "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5", + "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6", + "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4", + "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6", + "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7", + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5", + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_0_1", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4", + 
"/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84", + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9", + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1", + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87", + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10", + "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8", + "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11", + "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9", + "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6", + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2", + "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11", + "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12", + "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7", + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3", + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4", + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5", + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6", + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7", + 
"/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8", + "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9", + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10", + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11", + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19", + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13", + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14", + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25", + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16", + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17", + "/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28", + 
"/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31", + "/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19", + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20", + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21", + "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12", + "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10", + "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13", + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8", + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_0_2", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5", + 
"/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92", + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15", + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2", + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95", + "/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16", + "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14", + "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17", + "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9", + "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15", + "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18", + "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10", + "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16", + "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19", + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11", + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96", + 
"/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_0_3", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100", + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21", + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3", + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103", + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22", + "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18", + "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23", + "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19", + "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12", + 
"NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21", + "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24", + "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13", + "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22", + "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20", + "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25", + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14", + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_0_4", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107", + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108", + 
"/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27", + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4", + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111", + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28", + "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24", + "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29", + "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15", + "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25", + "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30", + "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16", + "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26", + "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31", + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17", + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_0_5", + 
"/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116", + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33", + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5", + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119", + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34", + "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28", + "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35", + "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29", + "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18", + "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30", + "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36", + "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19", + 
"NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31", + "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37", + "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20", + "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32", + "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38", + "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21", + "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33", + "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39", + "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22", + "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34", + "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40", + "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23", + "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35", + "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41", + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24", + "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20", + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12", + 
"/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123", + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123", + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42", + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38", + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13", + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124", + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43", + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6", + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127", + "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44", + "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37", + "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45", + "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25", + "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38", + "/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46", + "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26", + "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39", + 
"/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47", + "/up_blocks.0/Concat.out19_1_bfp.out20_0", + "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27", + "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41", + "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48", + "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28", + "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42", + "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40", + "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49", + "/up_blocks.0/Concat_1.out19_2_bfp.out20_1", + "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29", + "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44", + "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50", + "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30", + "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45", + "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43", + "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51", + "/up_blocks.0/Concat_2.out19_3_bfp.out20_2", + "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31", + "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47", + "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52", + "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32", + "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48", + "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46", + "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53", + "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0", + "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49", + "/up_blocks.1/Concat.out19_4_bfp.out20_3", + "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33", + "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51", + 
"/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54", + "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34", + "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52", + "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50", + "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55", + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35", + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_0_6", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56", + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132", + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57", + 
"/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7", + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135", + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58", + "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54", + "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59", + "/up_blocks.1/Concat_1.out19_5_bfp.out20_4", + "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36", + "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56", + "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60", + "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37", + "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57", + "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55", + "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61", + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38", + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_0_7", + 
"/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140", + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63", + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8", + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143", + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64", + "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59", + "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65", + "/up_blocks.1/Concat_2.out19_6_bfp.out20_5", + "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39", + "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61", + "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66", + "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40", + "NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62", + 
"NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60", + "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67", + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41", + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_0_8", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148", + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69", + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149", + 
"/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9", + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151", + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70", + "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64", + "/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71", + "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1", + "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65", + "/up_blocks.2/Concat.out19_7_bfp.out20_6", + "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42", + "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67", + "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72", + "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43", + "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68", + "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66", + "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73", + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44", + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_0_9", + 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156", + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75", + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10", + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159", + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76", + "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70", + "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77", + "/up_blocks.2/Concat_1.out19_8_bfp.out20_7", + "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45", + "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72", + "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78", + "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46", + "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73", + 
"NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71", + "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79", + "/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47", + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_0_10", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164", + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81", + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165", + 
"/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11", + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167", + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82", + "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75", + "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83", + "/up_blocks.2/Concat_2.out19_9_bfp.out20_8", + "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48", + "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77", + "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84", + "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49", + "NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78", + "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76", + "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85", + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50", + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_0_11", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86", + 
"/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172", + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87", + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12", + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175", + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88", + "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80", + "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89", + "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2", + "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81", + "/up_blocks.3/Concat.out19_10_bfp.out20_9", + "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51", + "NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83", + "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90", + "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52", + "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84", + 
"NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82", + "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91", + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53", + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_0_12", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180", + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93", + "/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181", + 
"/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13", + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183", + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94", + "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86", + "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95", + "/up_blocks.3/Concat_1.out19_11_bfp.out20_10", + "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54", + "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88", + "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96", + "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55", + "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89", + "NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87", + "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97", + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56", + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_0_13", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98", + 
"/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188", + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99", + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14", + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191", + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100", + "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91", + "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101", + "/up_blocks.3/Concat_2.out19_12_bfp.out20_11", + "GroupNorm_57.out7_57.out6_0_42_bfp.out7_57", + "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93", + "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102", + "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58", + "NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94", + "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92", + "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103", + 
"/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59", + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_0_14", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196", + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105", + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198", + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15", + 
"/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199", + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106", + "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96", + "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107", + "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60", + "GroupNorm_60.out7_60.out6_0_44" + ] + }, + "const": { + "buffer_size": 990732224, + "xrt_arg_id": 3, + "packed_tensors": [ + "NhwcConv_0_weight_NHWC", + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.wts", + "GroupNorm_0_wts_6_0_0", + "onnx::MatMul_5660", + "onnx::MatMul_5661", + "onnx::MatMul_5690", + "onnx::MatMul_5691", + "onnx::MatMul_5720", + "onnx::MatMul_5721", + "onnx::MatMul_5750", + "onnx::MatMul_5751", + "onnx::MatMul_5780", + "onnx::MatMul_5781", + "onnx::MatMul_5810", + "onnx::MatMul_5811", + "onnx::MatMul_5848", + "onnx::MatMul_5849", + "time_embedding.linear_1.weight_11_1_0", + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid.weights14_0", + "time_embedding.linear_2.weight_11_1_1", + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid.weights14_1", + "down_blocks.0.resnets.0.time_emb_proj.weight_11_1_2", + "NhwcConv_1_weight_NHWC", + "GroupNorm_1_wts_6_0_1", + "NhwcConv_2_weight_NHWC", + "GroupNorm_2_wts_6_2_0", + "NhwcConv_3_weight_NHWC", + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_0_qkv_weight_key", + "Attention_0_qkv_weight_query", + "Attention_0_qkv_weight_value", + "onnx::MatMul_5658_11_0_0", + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5659", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0_bfp.wts", + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.wts", + 
"onnx::MatMul_5669_11_0_1", + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5670_11_0_2_12_0_0", + "onnx::MatMul_5670_11_0_2_12_0_1", + "onnx::MatMul_5671_11_0_3", + "NhwcConv_4_weight_NHWC", + "GroupNorm_3_wts_6_0_2", + "down_blocks.0.resnets.1.time_emb_proj.weight_11_1_3", + "NhwcConv_5_weight_NHWC", + "GroupNorm_4_wts_6_0_3", + "NhwcConv_6_weight_NHWC", + "GroupNorm_5_wts_6_2_1", + "NhwcConv_7_weight_NHWC", + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias", + "Attention_1_qkv_weight_key", + "Attention_1_qkv_weight_query", + "Attention_1_qkv_weight_value", + "onnx::MatMul_5688_11_0_4", + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5689", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3_bfp.wts", + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.wts", + "onnx::MatMul_5699_11_0_5", + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5700_11_0_6_12_1_0", + "onnx::MatMul_5700_11_0_6_12_1_1", + "onnx::MatMul_5701_11_0_7", + "NhwcConv_8_weight_NHWC", + "NhwcConv_9_weight_NHWC", + "GroupNorm_6_wts_6_0_4", + "down_blocks.1.resnets.0.time_emb_proj.weight_11_1_4", + "NhwcConv_10_weight_NHWC", + "GroupNorm_7_wts_6_0_5", + "down_blocks.1.resnets.1.time_emb_proj.weight_11_1_5", + "down_blocks.2.resnets.0.time_emb_proj.weight_11_1_6", + "down_blocks.2.resnets.1.time_emb_proj.weight_11_1_7", + "down_blocks.3.resnets.0.time_emb_proj.weight_11_1_8", + "down_blocks.3.resnets.1.time_emb_proj.weight_11_1_9", + "mid_block.resnets.0.time_emb_proj.weight_11_1_10", + "mid_block.resnets.1.time_emb_proj.weight_11_1_11", + 
"up_blocks.0.resnets.0.time_emb_proj.weight_11_1_12", + "up_blocks.0.resnets.1.time_emb_proj.weight_11_1_13", + "up_blocks.0.resnets.2.time_emb_proj.weight_11_1_14", + "onnx::MatMul_5895", + "onnx::MatMul_5896", + "onnx::MatMul_5925", + "onnx::MatMul_5926", + "onnx::MatMul_5955", + "onnx::MatMul_5956", + "up_blocks.1.resnets.0.time_emb_proj.weight_11_1_15", + "up_blocks.1.resnets.1.time_emb_proj.weight_11_1_16", + "up_blocks.1.resnets.2.time_emb_proj.weight_11_1_17", + "onnx::MatMul_5986", + "onnx::MatMul_5987", + "onnx::MatMul_6016", + "onnx::MatMul_6017", + "onnx::MatMul_6046", + "onnx::MatMul_6047", + "up_blocks.2.resnets.0.time_emb_proj.weight_11_1_18", + "up_blocks.2.resnets.1.time_emb_proj.weight_11_1_19", + "up_blocks.2.resnets.2.time_emb_proj.weight_11_1_20", + "onnx::MatMul_6077", + "onnx::MatMul_6078", + "onnx::MatMul_6107", + "onnx::MatMul_6108", + "onnx::MatMul_6137", + "onnx::MatMul_6138", + "up_blocks.3.resnets.0.time_emb_proj.weight_11_1_21", + "up_blocks.3.resnets.1.time_emb_proj.weight_11_1_22", + "up_blocks.3.resnets.2.time_emb_proj.weight_11_1_23", + "NhwcConv_11_weight_NHWC", + "NhwcConv_12_weight_NHWC", + "GroupNorm_8_wts_6_2_2", + "NhwcConv_13_weight_NHWC", + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_2_qkv_weight_key", + "Attention_2_qkv_weight_query", + "Attention_2_qkv_weight_value", + "onnx::MatMul_5718_11_0_8", + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5719", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6_bfp.wts", + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.wts", + "onnx::MatMul_5729_11_0_9", + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias", + 
"onnx::MatMul_5730_11_0_10_12_2_0", + "onnx::MatMul_5730_11_0_10_12_2_1", + "onnx::MatMul_5731_11_0_11", + "NhwcConv_14_weight_NHWC", + "GroupNorm_9_wts_6_0_6", + "NhwcConv_15_weight_NHWC", + "GroupNorm_10_wts_6_0_7", + "NhwcConv_16_weight_NHWC", + "GroupNorm_11_wts_6_2_3", + "NhwcConv_17_weight_NHWC", + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias", + "Attention_3_qkv_weight_key", + "Attention_3_qkv_weight_query", + "Attention_3_qkv_weight_value", + "onnx::MatMul_5748_11_0_12", + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5749", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9_bfp.wts", + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.wts", + "onnx::MatMul_5759_11_0_13", + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5760_11_0_14_12_3_0", + "onnx::MatMul_5760_11_0_14_12_3_1", + "onnx::MatMul_5761_11_0_15", + "NhwcConv_18_weight_NHWC", + "NhwcConv_19_weight_NHWC", + "GroupNorm_12_wts_6_0_8", + "NhwcConv_20_weight_NHWC", + "GroupNorm_13_wts_6_0_9", + "NhwcConv_21_weight_NHWC", + "NhwcConv_22_weight_NHWC", + "GroupNorm_14_wts_6_2_4", + "NhwcConv_23_weight_NHWC", + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_4_qkv_weight_key", + "Attention_4_qkv_weight_query", + "Attention_4_qkv_weight_value", + "onnx::MatMul_5778_11_0_16", + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5779", + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12_bfp.wts", + 
"/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.wts", + "onnx::MatMul_5789_11_0_17", + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5790_11_0_18_12_4_0", + "onnx::MatMul_5790_11_0_18_12_4_1", + "onnx::MatMul_5791_11_0_19", + "NhwcConv_24_weight_NHWC", + "GroupNorm_15_wts_6_0_10", + "NhwcConv_25_weight_NHWC", + "GroupNorm_16_wts_6_0_11", + "NhwcConv_26_weight_NHWC", + "GroupNorm_17_wts_6_2_5", + "NhwcConv_27_weight_NHWC", + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias", + "Attention_5_qkv_weight_key", + "Attention_5_qkv_weight_query", + "Attention_5_qkv_weight_value", + "onnx::MatMul_5808_11_0_20", + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5809", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15_bfp.wts", + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.wts", + "onnx::MatMul_5819_11_0_21", + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5820_11_0_22_12_5_0", + "onnx::MatMul_5820_11_0_22_12_5_1", + "onnx::MatMul_5821_11_0_23", + "NhwcConv_28_weight_NHWC", + "NhwcConv_29_weight_NHWC", + "GroupNorm_18_wts_6_0_12", + "NhwcConv_30_weight_NHWC", + "GroupNorm_19_wts_6_0_13", + "NhwcConv_31_weight_NHWC", + "GroupNorm_20_wts_6_0_14", + "NhwcConv_32_weight_NHWC", + "GroupNorm_21_wts_6_0_15", + "NhwcConv_33_weight_NHWC", + "GroupNorm_22_wts_6_0_16", + "NhwcConv_34_weight_NHWC", + "GroupNorm_23_wts_6_0_17", + "NhwcConv_35_weight_NHWC", + "GroupNorm_24_wts_6_2_6", + "NhwcConv_36_weight_NHWC", + "mid_block.attentions.0.transformer_blocks.0.norm1.weight", + 
"mid_block.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_6_qkv_weight_key", + "Attention_6_qkv_weight_query", + "Attention_6_qkv_weight_value", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121_bfp.wts", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120_bfp.wts", + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122_bfp.wts", + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.wts", + "onnx::MatMul_5846_11_0_24", + "mid_block.attentions.0.transformer_blocks.0.norm2.weight", + "mid_block.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5847", + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18_bfp.wts", + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.wts", + "onnx::MatMul_5857_11_0_25", + "mid_block.attentions.0.transformer_blocks.0.norm3.weight", + "mid_block.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5858_11_0_26_12_6_0", + "onnx::MatMul_5858_11_0_26_12_6_1", + "onnx::MatMul_5859_11_0_27", + "NhwcConv_37_weight_NHWC", + "GroupNorm_25_wts_6_0_18", + "NhwcConv_38_weight_NHWC", + "GroupNorm_26_wts_6_0_19", + "NhwcConv_39_weight_NHWC", + "GroupNorm_27_wts_6_0_20", + "NhwcConv_40_weight_NHWC", + "GroupNorm_28_wts_6_0_21", + "NhwcConv_41_weight_NHWC", + "NhwcConv_42_weight_NHWC", + "GroupNorm_29_wts_6_0_22", + "NhwcConv_43_weight_NHWC", + "GroupNorm_30_wts_6_0_23", + "NhwcConv_44_weight_NHWC", + "NhwcConv_45_weight_NHWC", + "GroupNorm_31_wts_6_0_24", + "NhwcConv_46_weight_NHWC", + "GroupNorm_32_wts_6_0_25", + "NhwcConv_47_weight_NHWC", + "NhwcConv_48_weight_NHWC", + "/up_blocks.0/upsamplers.0/Resize.weights3_0", + "NhwcConv_49_weight_NHWC", + "GroupNorm_33_wts_6_0_26", + "NhwcConv_50_weight_NHWC", + 
"GroupNorm_34_wts_6_0_27", + "NhwcConv_51_weight_NHWC", + "NhwcConv_52_weight_NHWC", + "GroupNorm_35_wts_6_2_7", + "NhwcConv_53_weight_NHWC", + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_7_qkv_weight_key", + "Attention_7_qkv_weight_query", + "Attention_7_qkv_weight_value", + "onnx::MatMul_5893_11_0_28", + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5894", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21_bfp.wts", + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.wts", + "onnx::MatMul_5904_11_0_29", + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5905_11_0_30_12_7_0", + "onnx::MatMul_5905_11_0_30_12_7_1", + "onnx::MatMul_5906_11_0_31", + "NhwcConv_54_weight_NHWC", + "GroupNorm_36_wts_6_0_28", + "NhwcConv_55_weight_NHWC", + "GroupNorm_37_wts_6_0_29", + "NhwcConv_56_weight_NHWC", + "NhwcConv_57_weight_NHWC", + "GroupNorm_38_wts_6_2_8", + "NhwcConv_58_weight_NHWC", + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias", + "Attention_8_qkv_weight_key", + "Attention_8_qkv_weight_query", + "Attention_8_qkv_weight_value", + "onnx::MatMul_5923_11_0_32", + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5924", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24_bfp.wts", + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.wts", + "onnx::MatMul_5934_11_0_33", + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight", + 
"up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5935_11_0_34_12_8_0", + "onnx::MatMul_5935_11_0_34_12_8_1", + "onnx::MatMul_5936_11_0_35", + "NhwcConv_59_weight_NHWC", + "GroupNorm_39_wts_6_0_30", + "NhwcConv_60_weight_NHWC", + "GroupNorm_40_wts_6_0_31", + "NhwcConv_61_weight_NHWC", + "NhwcConv_62_weight_NHWC", + "GroupNorm_41_wts_6_2_9", + "NhwcConv_63_weight_NHWC", + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias", + "Attention_9_qkv_weight_key", + "Attention_9_qkv_weight_query", + "Attention_9_qkv_weight_value", + "onnx::MatMul_5953_11_0_36", + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5954", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27_bfp.wts", + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.wts", + "onnx::MatMul_5964_11_0_37", + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5965_11_0_38_12_9_0", + "onnx::MatMul_5965_11_0_38_12_9_1", + "onnx::MatMul_5966_11_0_39", + "NhwcConv_64_weight_NHWC", + "/up_blocks.1/upsamplers.0/Resize.weights3_1", + "NhwcConv_65_weight_NHWC", + "GroupNorm_42_wts_6_0_32", + "NhwcConv_66_weight_NHWC", + "GroupNorm_43_wts_6_0_33", + "NhwcConv_67_weight_NHWC", + "NhwcConv_68_weight_NHWC", + "GroupNorm_44_wts_6_2_10", + "NhwcConv_69_weight_NHWC", + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_10_qkv_weight_key", + "Attention_10_qkv_weight_query", + "Attention_10_qkv_weight_value", + "onnx::MatMul_5984_11_0_40", + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_5985", + 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30_bfp.wts", + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.wts", + "onnx::MatMul_5995_11_0_41", + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_5996_11_0_42_12_10_0", + "onnx::MatMul_5996_11_0_42_12_10_1", + "onnx::MatMul_5997_11_0_43", + "NhwcConv_70_weight_NHWC", + "GroupNorm_45_wts_6_0_34", + "NhwcConv_71_weight_NHWC", + "GroupNorm_46_wts_6_0_35", + "NhwcConv_72_weight_NHWC", + "NhwcConv_73_weight_NHWC", + "GroupNorm_47_wts_6_2_11", + "NhwcConv_74_weight_NHWC", + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias", + "Attention_11_qkv_weight_key", + "Attention_11_qkv_weight_query", + "Attention_11_qkv_weight_value", + "onnx::MatMul_6014_11_0_44", + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6015", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33_bfp.wts", + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.wts", + "onnx::MatMul_6025_11_0_45", + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6026_11_0_46_12_11_0", + "onnx::MatMul_6026_11_0_46_12_11_1", + "onnx::MatMul_6027_11_0_47", + "NhwcConv_75_weight_NHWC", + "GroupNorm_48_wts_6_0_36", + "NhwcConv_76_weight_NHWC", + "GroupNorm_49_wts_6_0_37", + "NhwcConv_77_weight_NHWC", + "NhwcConv_78_weight_NHWC", + "GroupNorm_50_wts_6_2_12", + "NhwcConv_79_weight_NHWC", + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias", + "Attention_12_qkv_weight_key", + 
"Attention_12_qkv_weight_query", + "Attention_12_qkv_weight_value", + "onnx::MatMul_6044_11_0_48", + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6045", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36_bfp.wts", + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.wts", + "onnx::MatMul_6055_11_0_49", + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight", + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6056_11_0_50_12_12_0", + "onnx::MatMul_6056_11_0_50_12_12_1", + "onnx::MatMul_6057_11_0_51", + "NhwcConv_80_weight_NHWC", + "/up_blocks.2/upsamplers.0/Resize.weights3_2", + "NhwcConv_81_weight_NHWC", + "GroupNorm_51_wts_6_0_38", + "NhwcConv_82_weight_NHWC", + "GroupNorm_52_wts_6_0_39", + "NhwcConv_83_weight_NHWC", + "NhwcConv_84_weight_NHWC", + "GroupNorm_53_wts_6_2_13", + "NhwcConv_85_weight_NHWC", + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias", + "Attention_13_qkv_weight_key", + "Attention_13_qkv_weight_query", + "Attention_13_qkv_weight_value", + "onnx::MatMul_6075_11_0_52", + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6076", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39_bfp.wts", + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.wts", + "onnx::MatMul_6086_11_0_53", + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6087_11_0_54_12_13_0", + "onnx::MatMul_6087_11_0_54_12_13_1", + "onnx::MatMul_6088_11_0_55", + "NhwcConv_86_weight_NHWC", + "GroupNorm_54_wts_6_0_40", + "NhwcConv_87_weight_NHWC", + 
"GroupNorm_55_wts_6_0_41", + "NhwcConv_88_weight_NHWC", + "NhwcConv_89_weight_NHWC", + "GroupNorm_56_wts_6_2_14", + "NhwcConv_90_weight_NHWC", + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias", + "Attention_14_qkv_weight_key", + "Attention_14_qkv_weight_query", + "Attention_14_qkv_weight_value", + "onnx::MatMul_6105_11_0_56", + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6106", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42_bfp.wts", + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.wts", + "onnx::MatMul_6116_11_0_57", + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight", + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6117_11_0_58_12_14_0", + "onnx::MatMul_6117_11_0_58_12_14_1", + "onnx::MatMul_6118_11_0_59", + "NhwcConv_91_weight_NHWC", + "GroupNorm_57_wts_6_0_42", + "NhwcConv_92_weight_NHWC", + "GroupNorm_58_wts_6_0_43", + "NhwcConv_93_weight_NHWC", + "NhwcConv_94_weight_NHWC", + "GroupNorm_59_wts_6_2_15", + "NhwcConv_95_weight_NHWC", + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias", + "Attention_15_qkv_weight_key", + "Attention_15_qkv_weight_query", + "Attention_15_qkv_weight_value", + "onnx::MatMul_6135_11_0_60", + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight", + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias", + "onnx::MatMul_6136", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45_bfp.wts", + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.wts", + "onnx::MatMul_6146_11_0_61", + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight", + 
"up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias", + "onnx::MatMul_6147_11_0_62_12_15_0", + "onnx::MatMul_6147_11_0_62_12_15_1", + "onnx::MatMul_6148_11_0_63", + "NhwcConv_96_weight_NHWC", + "GroupNorm_60_wts_6_0_44", + "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_bfp.wts", + "NhwcConv_97_weight_NHWC" + ] + }, + "super_instr": { + "buffer_size": 0, + "xrt_arg_id": 4, + "packed_tensors": [] + } + }, + "tensor_map": { + "Transpose_44_out-sample.out0_1_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 4 + ], + "size_in_bytes": 65536, + "op_tensor_size": 65536, + "offset": 0 + }, + "encoder_hidden_states.out2_6_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 77, + 768 + ], + "size_in_bytes": 236544, + "op_tensor_size": 236544, + "offset": 7399680 + }, + "/time_proj/Concat_1_output_0.out2_3_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 2, + 320 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 3377152 + }, + "NhwcConv_97_out-out_sample.out0_1_81": { + "packed_buffer_label": "out", + "xrt_arg_id": 1, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 4 + ], + "size_in_bytes": 65536, + "op_tensor_size": 65536, + "offset": 0 + }, + "NhwcConv_0_out-/conv_in/Conv_output_0.out0_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 0 + }, + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.out7_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 5242880 + }, + "GroupNorm_0.out7_0.out6_0_0_bfp.out7_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 
+ ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 7864320 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 10485760 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 10584320 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 10682880 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 10781440 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 10880000 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 11077120 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": 
[ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 11274240 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 11471360 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 11668480 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 12062720 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 12456960 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 12851200 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 13245440 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + 
"dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 13639680 + }, + "/time_embedding/linear_1/Gemm_output_0.out2_3_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 14033920 + }, + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid_out.out14_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 14039040 + }, + "/time_embedding/linear_2/Gemm_output_0.out2_3_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 14044160 + }, + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid_out.out14_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 14049280 + }, + "/down_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 14054400 + }, + "NhwcConv_1_out-/down_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_1_bfp.out1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 14055680 + }, + "/down_blocks.0/resnets.0/Add.out_17_1_0_bfp.out18_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 16677120 + }, + "GroupNorm_1.out7_1.out6_0_1_bfp.out7_1": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 19298560 + }, + "NhwcConv_2_out-/down_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_2_bfp.out1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 21920000 + }, + "/down_blocks.0/resnets.0/Add_1.out_17_1_1_bfp.out18_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 24541440 + }, + "/down_blocks.0/attentions.0/norm/Add_output_0_NHWC.out6_2_0_bfp.out7_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 27162880 + }, + "/down_blocks.0/attentions.0/Reshape_output_0.out0_0_0_bfp.out1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 29784320 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_0_bfp.out13_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 32405760 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_0_bfp.out9_73": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 35027200 + }, + 
"/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_1_bfp.out9_72": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 37648640 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_2_bfp.out9_74": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 40270080 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_0_bfp.out11_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 42891520 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_2_bfp.out9_75": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 45512960 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_2_bfp.out18_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 48134400 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_1_bfp.out13_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 50755840 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": 
"uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 53377280 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 55998720 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 61241600 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.out9_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 66484480 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_3_bfp.out9_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 69105920 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_3_bfp.out18_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 71727360 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_2_bfp.out13_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 74348800 + }, + 
"/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_0_bfp.out9_77": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 76970240 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_4_bfp.out9_78": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 87456000 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_1_bfp.out22_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 97941760 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_5_bfp.out9_79": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 108427520 + }, + "/down_blocks.0/attentions.0/Reshape_1_output_0.out_17_0_0_bfp.out18_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 111048960 + }, + "NhwcConv_4_out-/down_blocks.0/attentions.0/proj_out/Conv_output_0.out0_1_3_bfp.out1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 113670400 + }, + "/down_blocks.0/attentions.0/Add.out_17_1_4_bfp.out18_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + 
"offset": 116291840 + }, + "GroupNorm_3.out7_3.out6_0_2_bfp.out7_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 118913280 + }, + "/down_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 121534720 + }, + "NhwcConv_5_out-/down_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_4_bfp.out1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 121536000 + }, + "/down_blocks.0/resnets.1/Add.out_17_1_5_bfp.out18_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 124157440 + }, + "GroupNorm_4.out7_4.out6_0_3_bfp.out7_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 126778880 + }, + "NhwcConv_6_out-/down_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_5_bfp.out1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 129400320 + }, + "/down_blocks.0/resnets.1/Add_1.out_17_1_6_bfp.out18_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 132021760 + }, + "/down_blocks.0/attentions.1/norm/Add_output_0_NHWC.out6_2_1_bfp.out7_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 
2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 134643200 + }, + "/down_blocks.0/attentions.1/Reshape_output_0.out0_0_1_bfp.out1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 137264640 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_3_bfp.out13_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 139886080 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_3_bfp.out9_81": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 142507520 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_4_bfp.out9_80": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 145128960 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_5_bfp.out9_82": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 147750400 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_2_bfp.out11_0_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 150371840 + }, + 
"/down_blocks.0/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_6_bfp.out9_83": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 152993280 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_7_bfp.out18_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 155614720 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_4_bfp.out13_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 158236160 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 160857600 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 163479040 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 168721920 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.out9_84": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + 
"size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 173964800 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_7_bfp.out9_84": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 176586240 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_8_bfp.out18_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 179207680 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_5_bfp.out13_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 181829120 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_1_bfp.out9_85": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 184450560 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_8_bfp.out9_86": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 194936320 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_2_bfp.out22_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 205422080 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_9_bfp.out9_87": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 215907840 + }, + "/down_blocks.0/attentions.1/Reshape_1_output_0.out_17_0_1_bfp.out18_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 218529280 + }, + "NhwcConv_8_out-/down_blocks.0/attentions.1/proj_out/Conv_output_0.out0_1_6_bfp.out1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 221150720 + }, + "/down_blocks.0/attentions.1/Add.out_17_1_9_bfp.out18_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 223772160 + }, + "NhwcConv_9_out-/down_blocks.0/downsamplers.0/conv/Conv_output_0.out0_1_7_bfp.out1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 226393600 + }, + "GroupNorm_6.out7_6.out6_0_4_bfp.out7_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 320 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 227048960 + }, + "/down_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 227704320 + }, + "NhwcConv_10_out-/down_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_9_bfp.out1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, 
+ 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 227706880 + }, + "/down_blocks.1/resnets.0/Add.out_17_1_10_bfp.out18_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 229017600 + }, + "GroupNorm_7.out7_7.out6_0_5_bfp.out7_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 230328320 + }, + "/down_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 231639040 + }, + "/down_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231641600 + }, + "/down_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231646720 + }, + "/down_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231651840 + }, + "/down_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231656960 + }, + "/mid_block/resnets.0/Unsqueeze_1_output_0.out2_0_8": { + "packed_buffer_label": "scratch", + 
"xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231662080 + }, + "/mid_block/resnets.1/Unsqueeze_1_output_0.out2_0_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231667200 + }, + "/up_blocks.0/resnets.0/Unsqueeze_1_output_0.out2_0_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231672320 + }, + "/up_blocks.0/resnets.1/Unsqueeze_1_output_0.out2_0_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231677440 + }, + "/up_blocks.0/resnets.2/Unsqueeze_1_output_0.out2_0_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 231682560 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 231687680 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 232081920 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 
394240, + "op_tensor_size": 394240, + "offset": 232476160 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 232870400 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 233264640 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 160 + ], + "size_in_bytes": 394240, + "op_tensor_size": 394240, + "offset": 233658880 + }, + "/up_blocks.1/resnets.0/Unsqueeze_1_output_0.out2_0_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 234053120 + }, + "/up_blocks.1/resnets.1/Unsqueeze_1_output_0.out2_0_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 234058240 + }, + "/up_blocks.1/resnets.2/Unsqueeze_1_output_0.out2_0_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 1280 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 234063360 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 234068480 + }, + 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 234265600 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 234462720 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 234659840 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 234856960 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 80 + ], + "size_in_bytes": 197120, + "op_tensor_size": 197120, + "offset": 235054080 + }, + "/up_blocks.2/resnets.0/Unsqueeze_1_output_0.out2_0_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 235251200 + }, + "/up_blocks.2/resnets.1/Unsqueeze_1_output_0.out2_0_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 235253760 + }, + 
"/up_blocks.2/resnets.2/Unsqueeze_1_output_0.out2_0_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 640 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 235256320 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 235258880 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 235357440 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 235456000 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 235554560 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_k/MatMul_output_0.out2_6_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 235653120 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_v/MatMul_output_0.out2_6_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 77, + 40 + ], + "size_in_bytes": 98560, + "op_tensor_size": 98560, + "offset": 235751680 + }, + 
"/up_blocks.3/resnets.0/Unsqueeze_1_output_0.out2_0_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 235850240 + }, + "/up_blocks.3/resnets.1/Unsqueeze_1_output_0.out2_0_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 235851520 + }, + "/up_blocks.3/resnets.2/Unsqueeze_1_output_0.out2_0_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1, + 1, + 320 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 235852800 + }, + "NhwcConv_11_out-/down_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_10_bfp.out1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 235854080 + }, + "NhwcConv_12_out-/down_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_8_bfp.out1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 237164800 + }, + "/down_blocks.1/resnets.0/Add_1.out_17_1_11_bfp.out18_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 238475520 + }, + "/down_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_2_bfp.out7_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 239786240 + }, + "/down_blocks.1/attentions.0/Reshape_output_0.out0_0_2_bfp.out1_13": { + "packed_buffer_label": 
"scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 241096960 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_6_bfp.out13_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 242407680 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_6_bfp.out9_89": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 243718400 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_7_bfp.out9_88": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 245029120 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_8_bfp.out9_90": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 246339840 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_4_bfp.out11_0_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 247650560 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_10_bfp.out9_91": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + 
"op_tensor_size": 1310720, + "offset": 248961280 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_12_bfp.out18_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 250272000 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_7_bfp.out13_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 251582720 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 252893440 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 254204160 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 256825600 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.out9_92": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 259447040 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_11_bfp.out9_92": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + 
"dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 260757760 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_13_bfp.out18_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 262068480 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_8_bfp.out13_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 263379200 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_2_bfp.out9_93": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 264689920 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_12_bfp.out9_94": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 269932800 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_3_bfp.out22_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 275175680 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_13_bfp.out9_95": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 280418560 + }, + 
"/down_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_2_bfp.out18_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 281729280 + }, + "NhwcConv_14_out-/down_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_11_bfp.out1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 283040000 + }, + "/down_blocks.1/attentions.0/Add.out_17_1_14_bfp.out18_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 284350720 + }, + "GroupNorm_9.out7_9.out6_0_6_bfp.out7_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 285661440 + }, + "NhwcConv_15_out-/down_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_12_bfp.out1_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 286972160 + }, + "/down_blocks.1/resnets.1/Add.out_17_1_15_bfp.out18_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 288282880 + }, + "GroupNorm_10.out7_10.out6_0_7_bfp.out7_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 289593600 + }, + "NhwcConv_16_out-/down_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_13_bfp.out1_16": { + "packed_buffer_label": 
"scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 290904320 + }, + "/down_blocks.1/resnets.1/Add_1.out_17_1_16_bfp.out18_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 292215040 + }, + "/down_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_3_bfp.out7_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 293525760 + }, + "/down_blocks.1/attentions.1/Reshape_output_0.out0_0_3_bfp.out1_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 294836480 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_9_bfp.out13_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 296147200 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_9_bfp.out9_97": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 297457920 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_10_bfp.out9_96": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 298768640 + }, + 
"/down_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_11_bfp.out9_98": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 300079360 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_6_bfp.out11_0_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 301390080 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_14_bfp.out9_99": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 302700800 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_17_bfp.out18_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 304011520 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_10_bfp.out13_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 305322240 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 306632960 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + 
"shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 307943680 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 310565120 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.out9_100": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 313186560 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_15_bfp.out9_100": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 314497280 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_18_bfp.out18_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 315808000 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_11_bfp.out13_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 317118720 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_3_bfp.out9_101": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 318429440 + }, + 
"/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_16_bfp.out9_102": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 323672320 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_4_bfp.out22_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 328915200 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_17_bfp.out9_103": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 334158080 + }, + "/down_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_3_bfp.out18_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 335468800 + }, + "NhwcConv_18_out-/down_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_14_bfp.out1_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 336779520 + }, + "/down_blocks.1/attentions.1/Add.out_17_1_19_bfp.out18_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 338090240 + }, + "NhwcConv_19_out-/down_blocks.1/downsamplers.0/conv/Conv_output_0.out0_1_15_bfp.out1_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + 
"offset": 339400960 + }, + "GroupNorm_12.out7_12.out6_0_8_bfp.out7_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 640 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 339728640 + }, + "NhwcConv_20_out-/down_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_17_bfp.out1_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 340056320 + }, + "/down_blocks.2/resnets.0/Add.out_17_1_20_bfp.out18_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 340711680 + }, + "GroupNorm_13.out7_13.out6_0_9_bfp.out7_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 341367040 + }, + "NhwcConv_21_out-/down_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_18_bfp.out1_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 342022400 + }, + "NhwcConv_22_out-/down_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_16_bfp.out1_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 342677760 + }, + "/down_blocks.2/resnets.0/Add_1.out_17_1_21_bfp.out18_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 343333120 + }, + "/down_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_4_bfp.out7_14": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 343988480 + }, + "/down_blocks.2/attentions.0/Reshape_output_0.out0_0_4_bfp.out1_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 344643840 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_12_bfp.out13_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 345299200 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_12_bfp.out9_105": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 345954560 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_13_bfp.out9_104": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 346609920 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_14_bfp.out9_106": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 347265280 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_8_bfp.out11_0_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 
655360, + "offset": 347920640 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_18_bfp.out9_107": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 348576000 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_22_bfp.out18_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 349231360 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_13_bfp.out13_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 349886720 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 350542080 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 351197440 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 352508160 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.out9_108": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + 
"shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 353818880 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_19_bfp.out9_108": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 354474240 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_23_bfp.out18_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 355129600 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_14_bfp.out13_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 355784960 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_4_bfp.out9_109": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 356440320 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_20_bfp.out9_110": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 359061760 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_5_bfp.out22_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 361683200 + }, + 
"/down_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_21_bfp.out9_111": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 364304640 + }, + "/down_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_4_bfp.out18_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 364960000 + }, + "NhwcConv_24_out-/down_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_19_bfp.out1_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 365615360 + }, + "/down_blocks.2/attentions.0/Add.out_17_1_24_bfp.out18_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 366270720 + }, + "GroupNorm_15.out7_15.out6_0_10_bfp.out7_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 366926080 + }, + "NhwcConv_25_out-/down_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_20_bfp.out1_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 367581440 + }, + "/down_blocks.2/resnets.1/Add.out_17_1_25_bfp.out18_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 368236800 + }, + "GroupNorm_16.out7_16.out6_0_11_bfp.out7_16": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 368892160 + }, + "NhwcConv_26_out-/down_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_21_bfp.out1_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 369547520 + }, + "/down_blocks.2/resnets.1/Add_1.out_17_1_26_bfp.out18_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 370202880 + }, + "/down_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_5_bfp.out7_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 370858240 + }, + "/down_blocks.2/attentions.1/Reshape_output_0.out0_0_5_bfp.out1_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 371513600 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_15_bfp.out13_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 372168960 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_15_bfp.out9_113": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 372824320 + }, + 
"/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_16_bfp.out9_112": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 373479680 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_17_bfp.out9_114": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 374135040 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_10_bfp.out11_0_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 374790400 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_22_bfp.out9_115": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 375445760 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_27_bfp.out18_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 376101120 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_16_bfp.out13_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 376756480 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + 
"dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 377411840 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 378067200 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 379377920 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.out9_116": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 380688640 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_23_bfp.out9_116": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 381344000 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_28_bfp.out18_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 381999360 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_17_bfp.out13_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 382654720 + }, + 
"/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_5_bfp.out9_117": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 383310080 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_24_bfp.out9_118": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 385931520 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_6_bfp.out22_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 388552960 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_25_bfp.out9_119": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 391174400 + }, + "/down_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_5_bfp.out18_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 391829760 + }, + "NhwcConv_28_out-/down_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_22_bfp.out1_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 392485120 + }, + "/down_blocks.2/attentions.1/Add.out_17_1_29_bfp.out18_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + 
"offset": 393140480 + }, + "NhwcConv_29_out-/down_blocks.2/downsamplers.0/conv/Conv_output_0.out0_1_23_bfp.out1_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 393795840 + }, + "GroupNorm_18.out7_18.out6_0_12_bfp.out7_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 393959680 + }, + "NhwcConv_30_out-/down_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_24_bfp.out1_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 394123520 + }, + "/down_blocks.3/resnets.0/Add.out_17_1_30_bfp.out18_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 394287360 + }, + "GroupNorm_19.out7_19.out6_0_13_bfp.out7_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 394451200 + }, + "NhwcConv_31_out-/down_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_25_bfp.out1_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 394615040 + }, + "/down_blocks.3/resnets.0/Add_1.out_17_1_31_bfp.out18_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 394778880 + }, + "GroupNorm_20.out7_20.out6_0_14_bfp.out7_20": { + "packed_buffer_label": "scratch", + 
"xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 394942720 + }, + "NhwcConv_32_out-/down_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_26_bfp.out1_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 395106560 + }, + "/down_blocks.3/resnets.1/Add.out_17_1_32_bfp.out18_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 395270400 + }, + "GroupNorm_21.out7_21.out6_0_15_bfp.out7_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 395434240 + }, + "NhwcConv_33_out-/down_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_27_bfp.out1_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 395598080 + }, + "/down_blocks.3/resnets.1/Add_1.out_17_1_33_bfp.out18_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 395761920 + }, + "GroupNorm_22.out7_22.out6_0_16_bfp.out7_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 395925760 + }, + "NhwcConv_34_out-/mid_block/resnets.0/conv1/Conv_output_0.out0_1_28_bfp.out1_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 
163840, + "offset": 396089600 + }, + "/mid_block/resnets.0/Add.out_17_1_34_bfp.out18_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 396253440 + }, + "GroupNorm_23.out7_23.out6_0_17_bfp.out7_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 396417280 + }, + "NhwcConv_35_out-/mid_block/resnets.0/conv2/Conv_output_0.out0_1_29_bfp.out1_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 396581120 + }, + "/mid_block/resnets.0/Add_1.out_17_1_35_bfp.out18_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 396744960 + }, + "/mid_block/attentions.0/norm/Add_output_0_NHWC.out6_2_6_bfp.out7_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 396908800 + }, + "/mid_block/attentions.0/Reshape_output_0.out0_0_6_bfp.out1_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 397072640 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_18_bfp.out13_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 397236480 + }, + 
"/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 397400320 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 397564160 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 397728000 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 397891840 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 398219520 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 398547200 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_12": { + "packed_buffer_label": "scratch", + 
"xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 398874880 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.out9_123": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 399202560 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_26_bfp.out9_123": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 399366400 + }, + "/mid_block/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_36_bfp.out18_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 399530240 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_19_bfp.out13_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 399694080 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 399857920 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 64, + 160 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 400021760 + }, + 
"/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 400349440 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.out9_124": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 400677120 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_27_bfp.out9_124": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 400840960 + }, + "/mid_block/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_37_bfp.out18_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 401004800 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_20_bfp.out13_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 401168640 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_6_bfp.out9_125": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 5120 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 401332480 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_28_bfp.out9_126": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 5120 + ], + "size_in_bytes": 655360, + 
"op_tensor_size": 655360, + "offset": 401987840 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_7_bfp.out22_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 5120 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 402643200 + }, + "/mid_block/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_29_bfp.out9_127": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 403298560 + }, + "/mid_block/attentions.0/Reshape_1_output_0.out_17_0_6_bfp.out18_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 403462400 + }, + "NhwcConv_37_out-/mid_block/attentions.0/proj_out/Conv_output_0.out0_1_30_bfp.out1_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 403626240 + }, + "/mid_block/attentions.0/Add.out_17_1_38_bfp.out18_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 403790080 + }, + "GroupNorm_25.out7_25.out6_0_18_bfp.out7_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 403953920 + }, + "NhwcConv_38_out-/mid_block/resnets.1/conv1/Conv_output_0.out0_1_31_bfp.out1_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 404117760 + }, + 
"/mid_block/resnets.1/Add.out_17_1_39_bfp.out18_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 404281600 + }, + "GroupNorm_26.out7_26.out6_0_19_bfp.out7_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 404445440 + }, + "NhwcConv_39_out-/mid_block/resnets.1/conv2/Conv_output_0.out0_1_32_bfp.out1_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 404609280 + }, + "/mid_block/resnets.1/Add_1.out_17_1_40_bfp.out18_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 404773120 + }, + "/up_blocks.0/Concat.out19_1_bfp.out20_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 404936960 + }, + "GroupNorm_27.out7_27.out6_0_20_bfp.out7_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 405264640 + }, + "NhwcConv_40_out-/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_34_bfp.out1_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 405592320 + }, + "/up_blocks.0/resnets.0/Add.out_17_1_41_bfp.out18_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + 
"size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 405756160 + }, + "GroupNorm_28.out7_28.out6_0_21_bfp.out7_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 405920000 + }, + "NhwcConv_41_out-/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_35_bfp.out1_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 406083840 + }, + "NhwcConv_42_out-/up_blocks.0/resnets.0/conv_shortcut/Conv_output_0.out0_1_33_bfp.out1_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 406247680 + }, + "/up_blocks.0/resnets.0/Add_1.out_17_1_42_bfp.out18_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 406411520 + }, + "/up_blocks.0/Concat_1.out19_2_bfp.out20_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 406575360 + }, + "GroupNorm_29.out7_29.out6_0_22_bfp.out7_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 406903040 + }, + "NhwcConv_43_out-/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_37_bfp.out1_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 407230720 + }, + "/up_blocks.0/resnets.1/Add.out_17_1_43_bfp.out18_50": { 
+ "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 407394560 + }, + "GroupNorm_30.out7_30.out6_0_23_bfp.out7_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 407558400 + }, + "NhwcConv_44_out-/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_38_bfp.out1_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 407722240 + }, + "NhwcConv_45_out-/up_blocks.0/resnets.1/conv_shortcut/Conv_output_0.out0_1_36_bfp.out1_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 407886080 + }, + "/up_blocks.0/resnets.1/Add_1.out_17_1_44_bfp.out18_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 408049920 + }, + "/up_blocks.0/Concat_2.out19_3_bfp.out20_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 408213760 + }, + "GroupNorm_31.out7_31.out6_0_24_bfp.out7_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 2560 + ], + "size_in_bytes": 327680, + "op_tensor_size": 327680, + "offset": 408541440 + }, + "NhwcConv_46_out-/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_40_bfp.out1_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 
163840, + "op_tensor_size": 163840, + "offset": 408869120 + }, + "/up_blocks.0/resnets.2/Add.out_17_1_45_bfp.out18_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 409032960 + }, + "GroupNorm_32.out7_32.out6_0_25_bfp.out7_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 409196800 + }, + "NhwcConv_47_out-/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_41_bfp.out1_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 409360640 + }, + "NhwcConv_48_out-/up_blocks.0/resnets.2/conv_shortcut/Conv_output_0.out0_1_39_bfp.out1_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 409524480 + }, + "/up_blocks.0/resnets.2/Add_1.out_17_1_46_bfp.out18_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 8, + 1280 + ], + "size_in_bytes": 163840, + "op_tensor_size": 163840, + "offset": 409688320 + }, + "/up_blocks.0/upsamplers.0/Resize_output_0.nhwc5_0.out_3_0_bfp.out4_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 409852160 + }, + "NhwcConv_49_out-/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_42_bfp.out1_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 410507520 + }, + 
"/up_blocks.1/Concat.out19_4_bfp.out20_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 411162880 + }, + "GroupNorm_33.out7_33.out6_0_26_bfp.out7_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 412473600 + }, + "NhwcConv_50_out-/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_44_bfp.out1_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 413784320 + }, + "/up_blocks.1/resnets.0/Add.out_17_1_47_bfp.out18_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 414439680 + }, + "GroupNorm_34.out7_34.out6_0_27_bfp.out7_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 415095040 + }, + "NhwcConv_51_out-/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_45_bfp.out1_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 415750400 + }, + "NhwcConv_52_out-/up_blocks.1/resnets.0/conv_shortcut/Conv_output_0.out0_1_43_bfp.out1_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 416405760 + }, + "/up_blocks.1/resnets.0/Add_1.out_17_1_48_bfp.out18_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": 
"uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 417061120 + }, + "/up_blocks.1/attentions.0/norm/Add_output_0_NHWC.out6_2_7_bfp.out7_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 417716480 + }, + "/up_blocks.1/attentions.0/Reshape_output_0.out0_0_7_bfp.out1_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 418371840 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_21_bfp.out13_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 419027200 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_21_bfp.out9_129": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 419682560 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_22_bfp.out9_128": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 420337920 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_23_bfp.out9_130": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 420993280 + }, + 
"/up_blocks.1/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_14_bfp.out11_0_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 421648640 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_30_bfp.out9_131": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 422304000 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_49_bfp.out18_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 422959360 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_22_bfp.out13_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 423614720 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 424270080 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 424925440 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 
1310720, + "op_tensor_size": 1310720, + "offset": 426236160 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.out9_132": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 427546880 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_31_bfp.out9_132": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 428202240 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_50_bfp.out18_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 428857600 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_23_bfp.out13_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 429512960 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_7_bfp.out9_133": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 430168320 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_32_bfp.out9_134": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 432789760 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_8_bfp.out22_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + 
"dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 435411200 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_33_bfp.out9_135": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 438032640 + }, + "/up_blocks.1/attentions.0/Reshape_1_output_0.out_17_0_7_bfp.out18_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 438688000 + }, + "NhwcConv_54_out-/up_blocks.1/attentions.0/proj_out/Conv_output_0.out0_1_46_bfp.out1_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 439343360 + }, + "/up_blocks.1/attentions.0/Add.out_17_1_51_bfp.out18_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 439998720 + }, + "/up_blocks.1/Concat_1.out19_5_bfp.out20_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 440654080 + }, + "GroupNorm_36.out7_36.out6_0_28_bfp.out7_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 2560 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 441964800 + }, + "NhwcConv_55_out-/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_48_bfp.out1_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + 
"op_tensor_size": 655360, + "offset": 443275520 + }, + "/up_blocks.1/resnets.1/Add.out_17_1_52_bfp.out18_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 443930880 + }, + "GroupNorm_37.out7_37.out6_0_29_bfp.out7_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 444586240 + }, + "NhwcConv_56_out-/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_49_bfp.out1_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 445241600 + }, + "NhwcConv_57_out-/up_blocks.1/resnets.1/conv_shortcut/Conv_output_0.out0_1_47_bfp.out1_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 445896960 + }, + "/up_blocks.1/resnets.1/Add_1.out_17_1_53_bfp.out18_61": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 446552320 + }, + "/up_blocks.1/attentions.1/norm/Add_output_0_NHWC.out6_2_8_bfp.out7_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 447207680 + }, + "/up_blocks.1/attentions.1/Reshape_output_0.out0_0_8_bfp.out1_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 447863040 + }, + 
"/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_24_bfp.out13_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 448518400 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_24_bfp.out9_137": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 449173760 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_25_bfp.out9_136": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 449829120 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_26_bfp.out9_138": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 450484480 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_16_bfp.out11_0_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 451139840 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_34_bfp.out9_139": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 451795200 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_54_bfp.out18_62": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 
2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 452450560 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_25_bfp.out13_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 453105920 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 453761280 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 454416640 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 455727360 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.out9_140": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 457038080 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_35_bfp.out9_140": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 457693440 + }, + 
"/up_blocks.1/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_55_bfp.out18_63": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 458348800 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_26_bfp.out13_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 459004160 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_8_bfp.out9_141": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 459659520 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_36_bfp.out9_142": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 462280960 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_9_bfp.out22_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 464902400 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_37_bfp.out9_143": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 467523840 + }, + "/up_blocks.1/attentions.1/Reshape_1_output_0.out_17_0_8_bfp.out18_64": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + 
"op_tensor_size": 655360, + "offset": 468179200 + }, + "NhwcConv_59_out-/up_blocks.1/attentions.1/proj_out/Conv_output_0.out0_1_50_bfp.out1_59": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 468834560 + }, + "/up_blocks.1/attentions.1/Add.out_17_1_56_bfp.out18_65": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 469489920 + }, + "/up_blocks.1/Concat_2.out19_6_bfp.out20_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1920 + ], + "size_in_bytes": 983040, + "op_tensor_size": 983040, + "offset": 470145280 + }, + "GroupNorm_39.out7_39.out6_0_30_bfp.out7_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1920 + ], + "size_in_bytes": 983040, + "op_tensor_size": 983040, + "offset": 471128320 + }, + "NhwcConv_60_out-/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_52_bfp.out1_61": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 472111360 + }, + "/up_blocks.1/resnets.2/Add.out_17_1_57_bfp.out18_66": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 472766720 + }, + "GroupNorm_40.out7_40.out6_0_31_bfp.out7_40": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 473422080 + }, + "NhwcConv_61_out-/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_53_bfp.out1_62": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 474077440 + }, + "NhwcConv_62_out-/up_blocks.1/resnets.2/conv_shortcut/Conv_output_0.out0_1_51_bfp.out1_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 474732800 + }, + "/up_blocks.1/resnets.2/Add_1.out_17_1_58_bfp.out18_67": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 475388160 + }, + "/up_blocks.1/attentions.2/norm/Add_output_0_NHWC.out6_2_9_bfp.out7_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 476043520 + }, + "/up_blocks.1/attentions.2/Reshape_output_0.out0_0_9_bfp.out1_63": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 476698880 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_27_bfp.out13_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 477354240 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_27_bfp.out9_145": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 478009600 + }, + 
"/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_28_bfp.out9_144": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 478664960 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_29_bfp.out9_146": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 479320320 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_18_bfp.out11_0_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 479975680 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_38_bfp.out9_147": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 480631040 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_59_bfp.out18_68": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 481286400 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_28_bfp.out13_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 481941760 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", 
+ "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 482597120 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 256, + 160 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 483252480 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 484563200 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.out9_148": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 485873920 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_39_bfp.out9_148": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 486529280 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_60_bfp.out18_69": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 487184640 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_29_bfp.out13_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 487840000 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_9_bfp.out9_149": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 488495360 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_40_bfp.out9_150": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 491116800 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_10_bfp.out22_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 5120 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 493738240 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_41_bfp.out9_151": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 256, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 496359680 + }, + "/up_blocks.1/attentions.2/Reshape_1_output_0.out_17_0_9_bfp.out18_70": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 497015040 + }, + "NhwcConv_64_out-/up_blocks.1/attentions.2/proj_out/Conv_output_0.out0_1_54_bfp.out1_64": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 497670400 + }, + "/up_blocks.1/attentions.2/Add.out_17_1_61_bfp.out18_71": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 16, + 16, + 1280 + ], + "size_in_bytes": 655360, + "op_tensor_size": 655360, + "offset": 498325760 + }, + "/up_blocks.1/upsamplers.0/Resize_output_0.nhwc5_1.out_3_1_bfp.out4_1": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 498981120 + }, + "NhwcConv_65_out-/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_55_bfp.out1_65": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 501602560 + }, + "/up_blocks.2/Concat.out19_7_bfp.out20_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 1920 + ], + "size_in_bytes": 3932160, + "op_tensor_size": 3932160, + "offset": 504224000 + }, + "GroupNorm_42.out7_42.out6_0_32_bfp.out7_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 1920 + ], + "size_in_bytes": 3932160, + "op_tensor_size": 3932160, + "offset": 508156160 + }, + "NhwcConv_66_out-/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_57_bfp.out1_67": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 512088320 + }, + "/up_blocks.2/resnets.0/Add.out_17_1_62_bfp.out18_72": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 513399040 + }, + "GroupNorm_43.out7_43.out6_0_33_bfp.out7_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 514709760 + }, + "NhwcConv_67_out-/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_58_bfp.out1_68": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + 
"size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 516020480 + }, + "NhwcConv_68_out-/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_56_bfp.out1_66": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 517331200 + }, + "/up_blocks.2/resnets.0/Add_1.out_17_1_63_bfp.out18_73": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 518641920 + }, + "/up_blocks.2/attentions.0/norm/Add_output_0_NHWC.out6_2_10_bfp.out7_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 519952640 + }, + "/up_blocks.2/attentions.0/Reshape_output_0.out0_0_10_bfp.out1_69": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 521263360 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_30_bfp.out13_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 522574080 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_30_bfp.out9_153": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 523884800 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_31_bfp.out9_152": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": 
"uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 525195520 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_32_bfp.out9_154": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 526506240 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_20_bfp.out11_0_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 527816960 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_42_bfp.out9_155": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 529127680 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_64_bfp.out18_74": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 530438400 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_31_bfp.out13_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 531749120 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 533059840 + }, + 
"/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 534370560 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 536992000 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.out9_156": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 539613440 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_43_bfp.out9_156": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 540924160 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_65_bfp.out18_75": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 542234880 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_32_bfp.out13_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 543545600 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_10_bfp.out9_157": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + 
"size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 544856320 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_44_bfp.out9_158": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 550099200 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_11_bfp.out22_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 555342080 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_45_bfp.out9_159": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 560584960 + }, + "/up_blocks.2/attentions.0/Reshape_1_output_0.out_17_0_10_bfp.out18_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 561895680 + }, + "NhwcConv_70_out-/up_blocks.2/attentions.0/proj_out/Conv_output_0.out0_1_59_bfp.out1_70": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 563206400 + }, + "/up_blocks.2/attentions.0/Add.out_17_1_66_bfp.out18_77": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 564517120 + }, + "/up_blocks.2/Concat_1.out19_8_bfp.out20_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 2621440, 
+ "op_tensor_size": 2621440, + "offset": 565827840 + }, + "GroupNorm_45.out7_45.out6_0_34_bfp.out7_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 1280 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 568449280 + }, + "NhwcConv_71_out-/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_61_bfp.out1_72": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 571070720 + }, + "/up_blocks.2/resnets.1/Add.out_17_1_67_bfp.out18_78": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 572381440 + }, + "GroupNorm_46.out7_46.out6_0_35_bfp.out7_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 573692160 + }, + "NhwcConv_72_out-/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_62_bfp.out1_73": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 575002880 + }, + "NhwcConv_73_out-/up_blocks.2/resnets.1/conv_shortcut/Conv_output_0.out0_1_60_bfp.out1_71": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 576313600 + }, + "/up_blocks.2/resnets.1/Add_1.out_17_1_68_bfp.out18_79": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 577624320 + }, + 
"/up_blocks.2/attentions.1/norm/Add_output_0_NHWC.out6_2_11_bfp.out7_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 578935040 + }, + "/up_blocks.2/attentions.1/Reshape_output_0.out0_0_11_bfp.out1_74": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 580245760 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_33_bfp.out13_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 581556480 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_33_bfp.out9_161": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 582867200 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_34_bfp.out9_160": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 584177920 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_35_bfp.out9_162": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 585488640 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_22_bfp.out11_0_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + 
"shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 586799360 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_46_bfp.out9_163": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 588110080 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_69_bfp.out18_80": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 589420800 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_34_bfp.out13_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 590731520 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 592042240 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 593352960 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 595974400 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.out9_164": { 
+ "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 598595840 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_47_bfp.out9_164": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 599906560 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_70_bfp.out18_81": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 601217280 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_35_bfp.out13_35": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 602528000 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_11_bfp.out9_165": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 603838720 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_48_bfp.out9_166": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 609081600 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_12_bfp.out22_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 614324480 + }, + 
"/up_blocks.2/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_49_bfp.out9_167": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 619567360 + }, + "/up_blocks.2/attentions.1/Reshape_1_output_0.out_17_0_11_bfp.out18_82": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 620878080 + }, + "NhwcConv_75_out-/up_blocks.2/attentions.1/proj_out/Conv_output_0.out0_1_63_bfp.out1_75": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 622188800 + }, + "/up_blocks.2/attentions.1/Add.out_17_1_71_bfp.out18_83": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 623499520 + }, + "/up_blocks.2/Concat_2.out19_9_bfp.out20_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 960 + ], + "size_in_bytes": 1966080, + "op_tensor_size": 1966080, + "offset": 624810240 + }, + "GroupNorm_48.out7_48.out6_0_36_bfp.out7_48": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 960 + ], + "size_in_bytes": 1966080, + "op_tensor_size": 1966080, + "offset": 626776320 + }, + "NhwcConv_76_out-/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_65_bfp.out1_77": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 628742400 + }, + "/up_blocks.2/resnets.2/Add.out_17_1_72_bfp.out18_84": { + "packed_buffer_label": 
"scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 630053120 + }, + "GroupNorm_49.out7_49.out6_0_37_bfp.out7_49": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 631363840 + }, + "NhwcConv_77_out-/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_66_bfp.out1_78": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 632674560 + }, + "NhwcConv_78_out-/up_blocks.2/resnets.2/conv_shortcut/Conv_output_0.out0_1_64_bfp.out1_76": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 633985280 + }, + "/up_blocks.2/resnets.2/Add_1.out_17_1_73_bfp.out18_85": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 635296000 + }, + "/up_blocks.2/attentions.2/norm/Add_output_0_NHWC.out6_2_12_bfp.out7_50": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 636606720 + }, + "/up_blocks.2/attentions.2/Reshape_output_0.out0_0_12_bfp.out1_79": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 637917440 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_36_bfp.out13_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": 
"uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 639228160 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_36_bfp.out9_169": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 640538880 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_37_bfp.out9_168": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 641849600 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_38_bfp.out9_170": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 643160320 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_24_bfp.out11_0_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 644471040 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_50_bfp.out9_171": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 645781760 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_74_bfp.out18_86": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 647092480 + }, + 
"/up_blocks.2/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_37_bfp.out13_37": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 648403200 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 649713920 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 1024, + 80 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 651024640 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 653646080 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.out9_172": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 656267520 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_51_bfp.out9_172": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 657578240 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_75_bfp.out18_87": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + 
"size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 658888960 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_38_bfp.out13_38": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 660199680 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_12_bfp.out9_173": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 661510400 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_52_bfp.out9_174": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 666753280 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_13_bfp.out22_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 2560 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 671996160 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_53_bfp.out9_175": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 1024, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 677239040 + }, + "/up_blocks.2/attentions.2/Reshape_1_output_0.out_17_0_12_bfp.out18_88": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 678549760 + }, + "NhwcConv_80_out-/up_blocks.2/attentions.2/proj_out/Conv_output_0.out0_1_67_bfp.out1_80": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 
2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 679860480 + }, + "/up_blocks.2/attentions.2/Add.out_17_1_76_bfp.out18_89": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 32, + 32, + 640 + ], + "size_in_bytes": 1310720, + "op_tensor_size": 1310720, + "offset": 681171200 + }, + "/up_blocks.2/upsamplers.0/Resize_output_0.nhwc5_2.out_3_2_bfp.out4_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 682481920 + }, + "NhwcConv_81_out-/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_68_bfp.out1_81": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 687724800 + }, + "/up_blocks.3/Concat.out19_10_bfp.out20_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 960 + ], + "size_in_bytes": 7864320, + "op_tensor_size": 7864320, + "offset": 692967680 + }, + "GroupNorm_51.out7_51.out6_0_38_bfp.out7_51": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 960 + ], + "size_in_bytes": 7864320, + "op_tensor_size": 7864320, + "offset": 700832000 + }, + "NhwcConv_82_out-/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_70_bfp.out1_83": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 708696320 + }, + "/up_blocks.3/resnets.0/Add.out_17_1_77_bfp.out18_90": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + 
"offset": 711317760 + }, + "GroupNorm_52.out7_52.out6_0_39_bfp.out7_52": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 713939200 + }, + "NhwcConv_83_out-/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_71_bfp.out1_84": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 716560640 + }, + "NhwcConv_84_out-/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_69_bfp.out1_82": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 719182080 + }, + "/up_blocks.3/resnets.0/Add_1.out_17_1_78_bfp.out18_91": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 721803520 + }, + "/up_blocks.3/attentions.0/norm/Add_output_0_NHWC.out6_2_13_bfp.out7_53": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 724424960 + }, + "/up_blocks.3/attentions.0/Reshape_output_0.out0_0_13_bfp.out1_85": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 727046400 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_39_bfp.out13_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 729667840 + }, + 
"/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_39_bfp.out9_177": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 732289280 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_40_bfp.out9_176": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 734910720 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_41_bfp.out9_178": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 737532160 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out8_26_bfp.out11_0_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 740153600 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_54_bfp.out9_179": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 742775040 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_output_0.out_17_1_79_bfp.out18_92": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 745396480 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_40_bfp.out13_40": { + "packed_buffer_label": "scratch", + 
"xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 748017920 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 750639360 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 753260800 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out8_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 758503680 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.out9_180": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 763746560 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_55_bfp.out9_180": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 766368000 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/Add_1_output_0.out_17_1_80_bfp.out18_93": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 768989440 + }, + 
"/up_blocks.3/attentions.0/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_41_bfp.out13_41": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 771610880 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_13_bfp.out9_181": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 774232320 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_56_bfp.out9_182": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 784718080 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_14_bfp.out22_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 795203840 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_57_bfp.out9_183": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 805689600 + }, + "/up_blocks.3/attentions.0/Reshape_1_output_0.out_17_0_13_bfp.out18_94": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 808311040 + }, + "NhwcConv_86_out-/up_blocks.3/attentions.0/proj_out/Conv_output_0.out0_1_72_bfp.out1_86": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + 
"size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 810932480 + }, + "/up_blocks.3/attentions.0/Add.out_17_1_81_bfp.out18_95": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 813553920 + }, + "/up_blocks.3/Concat_1.out19_11_bfp.out20_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 816175360 + }, + "GroupNorm_54.out7_54.out6_0_40_bfp.out7_54": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 821418240 + }, + "NhwcConv_87_out-/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_74_bfp.out1_88": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 826661120 + }, + "/up_blocks.3/resnets.1/Add.out_17_1_82_bfp.out18_96": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 829282560 + }, + "GroupNorm_55.out7_55.out6_0_41_bfp.out7_55": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 831904000 + }, + "NhwcConv_88_out-/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_75_bfp.out1_89": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 834525440 + }, + 
"NhwcConv_89_out-/up_blocks.3/resnets.1/conv_shortcut/Conv_output_0.out0_1_73_bfp.out1_87": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 837146880 + }, + "/up_blocks.3/resnets.1/Add_1.out_17_1_83_bfp.out18_97": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 839768320 + }, + "/up_blocks.3/attentions.1/norm/Add_output_0_NHWC.out6_2_14_bfp.out7_56": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 842389760 + }, + "/up_blocks.3/attentions.1/Reshape_output_0.out0_0_14_bfp.out1_90": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 845011200 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_42_bfp.out13_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 847632640 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_42_bfp.out9_185": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 850254080 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_43_bfp.out9_184": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + 
"op_tensor_size": 2621440, + "offset": 852875520 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_44_bfp.out9_186": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 855496960 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/Reshape_3_output_0.out8_28_bfp.out11_0_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 858118400 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_58_bfp.out9_187": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 860739840 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_output_0.out_17_1_84_bfp.out18_98": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 863361280 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_43_bfp.out13_43": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 865982720 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 868604160 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46": { + "packed_buffer_label": "scratch", 
+ "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 871225600 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out8_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 876468480 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.out9_188": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 881711360 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_59_bfp.out9_188": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 884332800 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/Add_1_output_0.out_17_1_85_bfp.out18_99": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 886954240 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_44_bfp.out13_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 889575680 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_14_bfp.out9_189": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 892197120 + }, + 
"/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_60_bfp.out9_190": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 902682880 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_15_bfp.out22_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 913168640 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_61_bfp.out9_191": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 923654400 + }, + "/up_blocks.3/attentions.1/Reshape_1_output_0.out_17_0_14_bfp.out18_100": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 926275840 + }, + "NhwcConv_91_out-/up_blocks.3/attentions.1/proj_out/Conv_output_0.out0_1_76_bfp.out1_91": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 928897280 + }, + "/up_blocks.3/attentions.1/Add.out_17_1_86_bfp.out18_101": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 931518720 + }, + "/up_blocks.3/Concat_2.out19_12_bfp.out20_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 934140160 + }, + 
"GroupNorm_57.out7_57.out6_0_42_bfp.out7_57": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 640 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 939383040 + }, + "NhwcConv_92_out-/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_78_bfp.out1_93": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 944625920 + }, + "/up_blocks.3/resnets.2/Add.out_17_1_87_bfp.out18_102": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 947247360 + }, + "GroupNorm_58.out7_58.out6_0_43_bfp.out7_58": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 949868800 + }, + "NhwcConv_93_out-/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_79_bfp.out1_94": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 952490240 + }, + "NhwcConv_94_out-/up_blocks.3/resnets.2/conv_shortcut/Conv_output_0.out0_1_77_bfp.out1_92": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 955111680 + }, + "/up_blocks.3/resnets.2/Add_1.out_17_1_88_bfp.out18_103": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 957733120 + }, + "/up_blocks.3/attentions.2/norm/Add_output_0_NHWC.out6_2_15_bfp.out7_59": { + "packed_buffer_label": 
"scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 960354560 + }, + "/up_blocks.3/attentions.2/Reshape_output_0.out0_0_15_bfp.out1_95": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 962976000 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0.out12_45_bfp.out13_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 965597440 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_45_bfp.out9_193": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 968218880 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_46_bfp.out9_192": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 970840320 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_47_bfp.out9_194": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 973461760 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/Reshape_3_output_0.out8_30_bfp.out11_0_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 
976083200 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn1/to_out.0/Add_output_0.out2_3_62_bfp.out9_195": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 978704640 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_output_0.out_17_1_89_bfp.out18_104": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 981326080 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm2/LayerNormalization_output_0.out12_46_bfp.out13_46": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 983947520 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 986568960 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 8, + 4096, + 40 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 989190400 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out8_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 994433280 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.out9_196": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 
320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 999676160 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_out.0/Add_output_0.out2_3_63_bfp.out9_196": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1002297600 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/Add_1_output_0.out_17_1_90_bfp.out18_105": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1004919040 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/norm3/LayerNormalization_output_0.out12_47_bfp.out13_47": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1007540480 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_3_output_0.out2_2_15_bfp.out9_197": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 1010161920 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Slice_output_0.out2_3_64_bfp.out9_198": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 1020647680 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.0/Mul_4_output_0.out21_16_bfp.out22_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 1280 + ], + "size_in_bytes": 10485760, + "op_tensor_size": 10485760, + "offset": 1031133440 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/ff/net.2/Add_output_0.out2_3_65_bfp.out9_199": { + 
"packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 4096, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1041619200 + }, + "/up_blocks.3/attentions.2/Reshape_1_output_0.out_17_0_15_bfp.out18_106": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1044240640 + }, + "NhwcConv_96_out-/up_blocks.3/attentions.2/proj_out/Conv_output_0.out0_1_80_bfp.out1_96": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1046862080 + }, + "/up_blocks.3/attentions.2/Add.out_17_1_91_bfp.out18_107": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1049483520 + }, + "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "uint8", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 2621440, + "op_tensor_size": 2621440, + "offset": 1052104960 + }, + "GroupNorm_60.out7_60.out6_0_44": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 2, + 64, + 64, + 320 + ], + "size_in_bytes": 5242880, + "op_tensor_size": 5242880, + "offset": 1054726400 + }, + "NhwcConv_0_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 31040 + ], + "size_in_bytes": 31040, + "op_tensor_size": 31040, + "offset": 0, + "file_name": "cache/NhwcConv_0-conv_inConv_0.const", + "file_size": 31040 + }, + "NhwcConv_0_out-/conv_in/Conv_output_0.out6_0_0_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + 
"op_tensor_size": 128, + "offset": 31040, + "file_name": "cache/NhwcConv_0-conv_inConv_1.const", + "file_size": 128 + }, + "GroupNorm_0_wts_6_0_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 31168, + "file_name": "cache/NhwcConv_0-conv_inConv_2.const", + "file_size": 1280 + }, + "onnx::MatMul_5660": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 32448, + "file_name": "cache/NhwcConv_0-conv_inConv_3.const", + "file_size": 281600 + }, + "onnx::MatMul_5661": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 314048, + "file_name": "cache/NhwcConv_0-conv_inConv_4.const", + "file_size": 281600 + }, + "onnx::MatMul_5690": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 595648, + "file_name": "cache/NhwcConv_0-conv_inConv_5.const", + "file_size": 281600 + }, + "onnx::MatMul_5691": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 877248, + "file_name": "cache/NhwcConv_0-conv_inConv_6.const", + "file_size": 281600 + }, + "onnx::MatMul_5720": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 1158848, + "file_name": "cache/NhwcConv_0-conv_inConv_7.const", + "file_size": 563200 + }, + "onnx::MatMul_5721": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + 
"op_tensor_size": 563200, + "offset": 1722048, + "file_name": "cache/NhwcConv_0-conv_inConv_8.const", + "file_size": 563200 + }, + "onnx::MatMul_5750": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 2285248, + "file_name": "cache/NhwcConv_0-conv_inConv_9.const", + "file_size": 563200 + }, + "onnx::MatMul_5751": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 2848448, + "file_name": "cache/NhwcConv_0-conv_inConv_10.const", + "file_size": 563200 + }, + "onnx::MatMul_5780": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 3411648, + "file_name": "cache/NhwcConv_0-conv_inConv_11.const", + "file_size": 1121280 + }, + "onnx::MatMul_5781": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 4532928, + "file_name": "cache/NhwcConv_0-conv_inConv_12.const", + "file_size": 1121280 + }, + "onnx::MatMul_5810": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 5654208, + "file_name": "cache/NhwcConv_0-conv_inConv_13.const", + "file_size": 1121280 + }, + "onnx::MatMul_5811": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 6775488, + "file_name": "cache/NhwcConv_0-conv_inConv_14.const", + "file_size": 1121280 + }, + "onnx::MatMul_5848": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + 
], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 7896768, + "file_name": "cache/NhwcConv_0-conv_inConv_15.const", + "file_size": 1121280 + }, + "onnx::MatMul_5849": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 9018048, + "file_name": "cache/NhwcConv_0-conv_inConv_16.const", + "file_size": 1121280 + }, + "time_embedding.linear_1.weight_11_1_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 10139328, + "file_name": "cache/NhwcConv_0-conv_inConv_17.const", + "file_size": 471040 + }, + "/time_embedding/act/Mul/QuickGeluFusion/_sigmoid.weights14_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "op_tensor_size": 256, + "offset": 10610368, + "file_name": "cache/NhwcConv_0-conv_inConv_18.const", + "file_size": 256 + }, + "time_embedding.linear_2.weight_11_1_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 10610624, + "file_name": "cache/NhwcConv_0-conv_inConv_19.const", + "file_size": 1868800 + }, + "/down_blocks.0/resnets.0/act_1/Mul/QuickGeluFusion/_sigmoid.weights14_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "op_tensor_size": 256, + "offset": 12479424, + "file_name": "cache/NhwcConv_0-conv_inConv_20.const", + "file_size": 256 + }, + "down_blocks.0.resnets.0.time_emb_proj.weight_11_1_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "op_tensor_size": 467200, + "offset": 12479680, + "file_name": 
"cache/NhwcConv_0-conv_inConv_21.const", + "file_size": 467200 + }, + "NhwcConv_1_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + "offset": 12946880, + "file_name": "cache/NhwcConv_0-conv_inConv_22.const", + "file_size": 1077760 + }, + "GroupNorm_1_wts_6_0_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 14024640, + "file_name": "cache/NhwcConv_0-conv_inConv_23.const", + "file_size": 1280 + }, + "NhwcConv_2_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + "offset": 14025920, + "file_name": "cache/NhwcConv_0-conv_inConv_24.const", + "file_size": 1077760 + }, + "GroupNorm_2_wts_6_2_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 15103680, + "file_name": "cache/NhwcConv_0-conv_inConv_25.const", + "file_size": 1280 + }, + "NhwcConv_3_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 15104960, + "file_name": "cache/NhwcConv_0-conv_inConv_26.const", + "file_size": 125440 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 15230400, + "file_name": "cache/NhwcConv_0-conv_inConv_27.const", + "file_size": 640 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 
320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 15231040, + "file_name": "cache/NhwcConv_0-conv_inConv_28.const", + "file_size": 640 + }, + "Attention_0_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 15231680, + "file_name": "cache/NhwcConv_0-conv_inConv_29.const", + "file_size": 118400 + }, + "Attention_0_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 15350080, + "file_name": "cache/NhwcConv_0-conv_inConv_30.const", + "file_size": 118400 + }, + "Attention_0_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 15468480, + "file_name": "cache/NhwcConv_0-conv_inConv_31.const", + "file_size": 118400 + }, + "onnx::MatMul_5658_11_0_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 15586880, + "file_name": "cache/NhwcConv_0-conv_inConv_32.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 15704640, + "file_name": "cache/NhwcConv_0-conv_inConv_33.const", + "file_size": 640 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 15705280, + "file_name": "cache/NhwcConv_0-conv_inConv_34.const", + "file_size": 640 + }, + 
"onnx::MatMul_5659": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 15705920, + "file_name": "cache/NhwcConv_0-conv_inConv_35.const", + "file_size": 118400 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_32_bfp.out9_0_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 15824320, + "file_name": "cache/NhwcConv_0-conv_inConv_36.const", + "file_size": 128 + }, + "/down_blocks.0/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_3_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 15824448, + "file_name": "cache/NhwcConv_0-conv_inConv_37.const", + "file_size": 128 + }, + "onnx::MatMul_5669_11_0_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 15824576, + "file_name": "cache/NhwcConv_0-conv_inConv_38.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 15942336, + "file_name": "cache/NhwcConv_0-conv_inConv_39.const", + "file_size": 640 + }, + "down_blocks.0.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 15942976, + "file_name": "cache/NhwcConv_0-conv_inConv_40.const", + "file_size": 640 + }, + "onnx::MatMul_5670_11_0_2_12_0_0": { + "packed_buffer_label": 
"const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 15943616, + "file_name": "cache/NhwcConv_0-conv_inConv_41.const", + "file_size": 471040 + }, + "onnx::MatMul_5670_11_0_2_12_0_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 16414656, + "file_name": "cache/NhwcConv_0-conv_inConv_42.const", + "file_size": 471040 + }, + "onnx::MatMul_5671_11_0_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 16885696, + "file_name": "cache/NhwcConv_0-conv_inConv_43.const", + "file_size": 471040 + }, + "NhwcConv_4_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 17356736, + "file_name": "cache/NhwcConv_0-conv_inConv_44.const", + "file_size": 125440 + }, + "GroupNorm_3_wts_6_0_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 17482176, + "file_name": "cache/NhwcConv_0-conv_inConv_45.const", + "file_size": 1280 + }, + "down_blocks.0.resnets.1.time_emb_proj.weight_11_1_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "op_tensor_size": 467200, + "offset": 17483456, + "file_name": "cache/NhwcConv_0-conv_inConv_46.const", + "file_size": 467200 + }, + "NhwcConv_5_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + "offset": 17950656, + "file_name": 
"cache/NhwcConv_0-conv_inConv_47.const", + "file_size": 1077760 + }, + "GroupNorm_4_wts_6_0_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 19028416, + "file_name": "cache/NhwcConv_0-conv_inConv_48.const", + "file_size": 1280 + }, + "NhwcConv_6_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + "offset": 19029696, + "file_name": "cache/NhwcConv_0-conv_inConv_49.const", + "file_size": 1077760 + }, + "GroupNorm_5_wts_6_2_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 20107456, + "file_name": "cache/NhwcConv_0-conv_inConv_50.const", + "file_size": 1280 + }, + "NhwcConv_7_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 20108736, + "file_name": "cache/NhwcConv_0-conv_inConv_51.const", + "file_size": 125440 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 20234176, + "file_name": "cache/NhwcConv_0-conv_inConv_52.const", + "file_size": 640 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 20234816, + "file_name": "cache/NhwcConv_0-conv_inConv_53.const", + "file_size": 640 + }, + "Attention_1_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + 
], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 20235456, + "file_name": "cache/NhwcConv_0-conv_inConv_54.const", + "file_size": 118400 + }, + "Attention_1_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 20353856, + "file_name": "cache/NhwcConv_0-conv_inConv_55.const", + "file_size": 118400 + }, + "Attention_1_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 20472256, + "file_name": "cache/NhwcConv_0-conv_inConv_56.const", + "file_size": 118400 + }, + "onnx::MatMul_5688_11_0_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 20590656, + "file_name": "cache/NhwcConv_0-conv_inConv_57.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 20708416, + "file_name": "cache/NhwcConv_0-conv_inConv_58.const", + "file_size": 640 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 20709056, + "file_name": "cache/NhwcConv_0-conv_inConv_59.const", + "file_size": 640 + }, + "onnx::MatMul_5689": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 20709696, + "file_name": "cache/NhwcConv_0-conv_inConv_60.const", + "file_size": 118400 + }, + 
"/down_blocks.0/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_33_bfp.out9_3_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 20828096, + "file_name": "cache/NhwcConv_0-conv_inConv_61.const", + "file_size": 128 + }, + "/down_blocks.0/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_7_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 20828224, + "file_name": "cache/NhwcConv_0-conv_inConv_62.const", + "file_size": 128 + }, + "onnx::MatMul_5699_11_0_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 20828352, + "file_name": "cache/NhwcConv_0-conv_inConv_63.const", + "file_size": 117760 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 20946112, + "file_name": "cache/NhwcConv_0-conv_inConv_64.const", + "file_size": 640 + }, + "down_blocks.0.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 20946752, + "file_name": "cache/NhwcConv_0-conv_inConv_65.const", + "file_size": 640 + }, + "onnx::MatMul_5700_11_0_6_12_1_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 20947392, + "file_name": "cache/NhwcConv_0-conv_inConv_66.const", + "file_size": 471040 + }, + "onnx::MatMul_5700_11_0_6_12_1_1": { + 
"packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 21418432, + "file_name": "cache/NhwcConv_0-conv_inConv_67.const", + "file_size": 471040 + }, + "onnx::MatMul_5701_11_0_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 21889472, + "file_name": "cache/NhwcConv_0-conv_inConv_68.const", + "file_size": 471040 + }, + "NhwcConv_8_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 22360512, + "file_name": "cache/NhwcConv_0-conv_inConv_69.const", + "file_size": 125440 + }, + "NhwcConv_9_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1062400 + ], + "size_in_bytes": 1062400, + "op_tensor_size": 1062400, + "offset": 22485952, + "file_name": "cache/NhwcConv_0-conv_inConv_70.const", + "file_size": 1062400 + }, + "GroupNorm_6_wts_6_0_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 23548352, + "file_name": "cache/NhwcConv_0-conv_inConv_71.const", + "file_size": 1280 + }, + "down_blocks.1.resnets.0.time_emb_proj.weight_11_1_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "op_tensor_size": 934400, + "offset": 23549632, + "file_name": "cache/NhwcConv_0-conv_inConv_72.const", + "file_size": 934400 + }, + "NhwcConv_10_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2155520 + ], + "size_in_bytes": 2155520, + "op_tensor_size": 2155520, + "offset": 24484032, + "file_name": 
"cache/NhwcConv_0-conv_inConv_73.const", + "file_size": 2155520 + }, + "GroupNorm_7_wts_6_0_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 26639552, + "file_name": "cache/NhwcConv_0-conv_inConv_74.const", + "file_size": 2560 + }, + "down_blocks.1.resnets.1.time_emb_proj.weight_11_1_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "op_tensor_size": 934400, + "offset": 26642112, + "file_name": "cache/NhwcConv_0-conv_inConv_75.const", + "file_size": 934400 + }, + "down_blocks.2.resnets.0.time_emb_proj.weight_11_1_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 27576512, + "file_name": "cache/NhwcConv_0-conv_inConv_76.const", + "file_size": 1868800 + }, + "down_blocks.2.resnets.1.time_emb_proj.weight_11_1_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 29445312, + "file_name": "cache/NhwcConv_0-conv_inConv_77.const", + "file_size": 1868800 + }, + "down_blocks.3.resnets.0.time_emb_proj.weight_11_1_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 31314112, + "file_name": "cache/NhwcConv_0-conv_inConv_78.const", + "file_size": 1868800 + }, + "down_blocks.3.resnets.1.time_emb_proj.weight_11_1_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 33182912, + "file_name": "cache/NhwcConv_0-conv_inConv_79.const", + "file_size": 1868800 + }, + 
"mid_block.resnets.0.time_emb_proj.weight_11_1_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 35051712, + "file_name": "cache/NhwcConv_0-conv_inConv_80.const", + "file_size": 1868800 + }, + "mid_block.resnets.1.time_emb_proj.weight_11_1_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 36920512, + "file_name": "cache/NhwcConv_0-conv_inConv_81.const", + "file_size": 1868800 + }, + "up_blocks.0.resnets.0.time_emb_proj.weight_11_1_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 38789312, + "file_name": "cache/NhwcConv_0-conv_inConv_82.const", + "file_size": 1868800 + }, + "up_blocks.0.resnets.1.time_emb_proj.weight_11_1_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 40658112, + "file_name": "cache/NhwcConv_0-conv_inConv_83.const", + "file_size": 1868800 + }, + "up_blocks.0.resnets.2.time_emb_proj.weight_11_1_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 42526912, + "file_name": "cache/NhwcConv_0-conv_inConv_84.const", + "file_size": 1868800 + }, + "onnx::MatMul_5895": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 44395712, + "file_name": "cache/NhwcConv_0-conv_inConv_85.const", + "file_size": 1121280 + }, + "onnx::MatMul_5896": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + 
"dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 45516992, + "file_name": "cache/NhwcConv_0-conv_inConv_86.const", + "file_size": 1121280 + }, + "onnx::MatMul_5925": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 46638272, + "file_name": "cache/NhwcConv_0-conv_inConv_87.const", + "file_size": 1121280 + }, + "onnx::MatMul_5926": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 47759552, + "file_name": "cache/NhwcConv_0-conv_inConv_88.const", + "file_size": 1121280 + }, + "onnx::MatMul_5955": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 48880832, + "file_name": "cache/NhwcConv_0-conv_inConv_89.const", + "file_size": 1121280 + }, + "onnx::MatMul_5956": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1121280 + ], + "size_in_bytes": 1121280, + "op_tensor_size": 1121280, + "offset": 50002112, + "file_name": "cache/NhwcConv_0-conv_inConv_90.const", + "file_size": 1121280 + }, + "up_blocks.1.resnets.0.time_emb_proj.weight_11_1_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 51123392, + "file_name": "cache/NhwcConv_0-conv_inConv_91.const", + "file_size": 1868800 + }, + "up_blocks.1.resnets.1.time_emb_proj.weight_11_1_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 52992192, + "file_name": 
"cache/NhwcConv_0-conv_inConv_92.const", + "file_size": 1868800 + }, + "up_blocks.1.resnets.2.time_emb_proj.weight_11_1_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 54860992, + "file_name": "cache/NhwcConv_0-conv_inConv_93.const", + "file_size": 1868800 + }, + "onnx::MatMul_5986": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 56729792, + "file_name": "cache/NhwcConv_0-conv_inConv_94.const", + "file_size": 563200 + }, + "onnx::MatMul_5987": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 57292992, + "file_name": "cache/NhwcConv_0-conv_inConv_95.const", + "file_size": 563200 + }, + "onnx::MatMul_6016": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 57856192, + "file_name": "cache/NhwcConv_0-conv_inConv_96.const", + "file_size": 563200 + }, + "onnx::MatMul_6017": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 58419392, + "file_name": "cache/NhwcConv_0-conv_inConv_97.const", + "file_size": 563200 + }, + "onnx::MatMul_6046": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + "op_tensor_size": 563200, + "offset": 58982592, + "file_name": "cache/NhwcConv_0-conv_inConv_98.const", + "file_size": 563200 + }, + "onnx::MatMul_6047": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 563200 + ], + "size_in_bytes": 563200, + 
"op_tensor_size": 563200, + "offset": 59545792, + "file_name": "cache/NhwcConv_0-conv_inConv_99.const", + "file_size": 563200 + }, + "up_blocks.2.resnets.0.time_emb_proj.weight_11_1_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "op_tensor_size": 934400, + "offset": 60108992, + "file_name": "cache/NhwcConv_0-conv_inConv_100.const", + "file_size": 934400 + }, + "up_blocks.2.resnets.1.time_emb_proj.weight_11_1_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "op_tensor_size": 934400, + "offset": 61043392, + "file_name": "cache/NhwcConv_0-conv_inConv_101.const", + "file_size": 934400 + }, + "up_blocks.2.resnets.2.time_emb_proj.weight_11_1_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 934400 + ], + "size_in_bytes": 934400, + "op_tensor_size": 934400, + "offset": 61977792, + "file_name": "cache/NhwcConv_0-conv_inConv_102.const", + "file_size": 934400 + }, + "onnx::MatMul_6077": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 62912192, + "file_name": "cache/NhwcConv_0-conv_inConv_103.const", + "file_size": 281600 + }, + "onnx::MatMul_6078": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 63193792, + "file_name": "cache/NhwcConv_0-conv_inConv_104.const", + "file_size": 281600 + }, + "onnx::MatMul_6107": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 63475392, + "file_name": "cache/NhwcConv_0-conv_inConv_105.const", + "file_size": 281600 + }, + "onnx::MatMul_6108": { + 
"packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 63756992, + "file_name": "cache/NhwcConv_0-conv_inConv_106.const", + "file_size": 281600 + }, + "onnx::MatMul_6137": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 64038592, + "file_name": "cache/NhwcConv_0-conv_inConv_107.const", + "file_size": 281600 + }, + "onnx::MatMul_6138": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 281600 + ], + "size_in_bytes": 281600, + "op_tensor_size": 281600, + "offset": 64320192, + "file_name": "cache/NhwcConv_0-conv_inConv_108.const", + "file_size": 281600 + }, + "up_blocks.3.resnets.0.time_emb_proj.weight_11_1_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "op_tensor_size": 467200, + "offset": 64601792, + "file_name": "cache/NhwcConv_0-conv_inConv_109.const", + "file_size": 467200 + }, + "up_blocks.3.resnets.1.time_emb_proj.weight_11_1_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "op_tensor_size": 467200, + "offset": 65068992, + "file_name": "cache/NhwcConv_0-conv_inConv_110.const", + "file_size": 467200 + }, + "up_blocks.3.resnets.2.time_emb_proj.weight_11_1_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 467200 + ], + "size_in_bytes": 467200, + "op_tensor_size": 467200, + "offset": 65536192, + "file_name": "cache/NhwcConv_0-conv_inConv_111.const", + "file_size": 467200 + }, + "NhwcConv_11_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 
4311040, + "offset": 66003392, + "file_name": "cache/NhwcConv_0-conv_inConv_112.const", + "file_size": 4311040 + }, + "NhwcConv_12_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 250880 + ], + "size_in_bytes": 250880, + "op_tensor_size": 250880, + "offset": 70314432, + "file_name": "cache/NhwcConv_0-conv_inConv_113.const", + "file_size": 250880 + }, + "GroupNorm_8_wts_6_2_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 70565312, + "file_name": "cache/NhwcConv_0-conv_inConv_114.const", + "file_size": 2560 + }, + "NhwcConv_13_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 70567872, + "file_name": "cache/NhwcConv_0-conv_inConv_115.const", + "file_size": 501760 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 71069632, + "file_name": "cache/NhwcConv_0-conv_inConv_116.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 71070912, + "file_name": "cache/NhwcConv_0-conv_inConv_117.const", + "file_size": 1280 + }, + "Attention_2_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 71072192, + "file_name": "cache/NhwcConv_0-conv_inConv_118.const", + "file_size": 473600 + }, + "Attention_2_qkv_weight_query": { + "packed_buffer_label": 
"const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 71545792, + "file_name": "cache/NhwcConv_0-conv_inConv_119.const", + "file_size": 473600 + }, + "Attention_2_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 72019392, + "file_name": "cache/NhwcConv_0-conv_inConv_120.const", + "file_size": 473600 + }, + "onnx::MatMul_5718_11_0_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 72492992, + "file_name": "cache/NhwcConv_0-conv_inConv_121.const", + "file_size": 473600 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 72966592, + "file_name": "cache/NhwcConv_0-conv_inConv_122.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 72967872, + "file_name": "cache/NhwcConv_0-conv_inConv_123.const", + "file_size": 1280 + }, + "onnx::MatMul_5719": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 72969152, + "file_name": "cache/NhwcConv_0-conv_inConv_124.const", + "file_size": 473600 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_34_bfp.out9_6_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + 
"size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 73442752, + "file_name": "cache/NhwcConv_0-conv_inConv_125.const", + "file_size": 128 + }, + "/down_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_11_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 73442880, + "file_name": "cache/NhwcConv_0-conv_inConv_126.const", + "file_size": 128 + }, + "onnx::MatMul_5729_11_0_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 73443008, + "file_name": "cache/NhwcConv_0-conv_inConv_127.const", + "file_size": 473600 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 73916608, + "file_name": "cache/NhwcConv_0-conv_inConv_128.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 73917888, + "file_name": "cache/NhwcConv_0-conv_inConv_129.const", + "file_size": 1280 + }, + "onnx::MatMul_5730_11_0_10_12_2_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 73919168, + "file_name": "cache/NhwcConv_0-conv_inConv_130.const", + "file_size": 1868800 + }, + "onnx::MatMul_5730_11_0_10_12_2_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 75787968, + "file_name": 
"cache/NhwcConv_0-conv_inConv_131.const", + "file_size": 1868800 + }, + "onnx::MatMul_5731_11_0_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "op_tensor_size": 1884160, + "offset": 77656768, + "file_name": "cache/NhwcConv_0-conv_inConv_132.const", + "file_size": 1884160 + }, + "NhwcConv_14_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 79540928, + "file_name": "cache/NhwcConv_0-conv_inConv_133.const", + "file_size": 501760 + }, + "GroupNorm_9_wts_6_0_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 80042688, + "file_name": "cache/NhwcConv_0-conv_inConv_134.const", + "file_size": 2560 + }, + "NhwcConv_15_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 4311040, + "offset": 80045248, + "file_name": "cache/NhwcConv_0-conv_inConv_135.const", + "file_size": 4311040 + }, + "GroupNorm_10_wts_6_0_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 84356288, + "file_name": "cache/NhwcConv_0-conv_inConv_136.const", + "file_size": 2560 + }, + "NhwcConv_16_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 4311040, + "offset": 84358848, + "file_name": "cache/NhwcConv_0-conv_inConv_137.const", + "file_size": 4311040 + }, + "GroupNorm_11_wts_6_2_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + 
"op_tensor_size": 2560, + "offset": 88669888, + "file_name": "cache/NhwcConv_0-conv_inConv_138.const", + "file_size": 2560 + }, + "NhwcConv_17_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 88672448, + "file_name": "cache/NhwcConv_0-conv_inConv_139.const", + "file_size": 501760 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 89174208, + "file_name": "cache/NhwcConv_0-conv_inConv_140.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 89175488, + "file_name": "cache/NhwcConv_0-conv_inConv_141.const", + "file_size": 1280 + }, + "Attention_3_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 89176768, + "file_name": "cache/NhwcConv_0-conv_inConv_142.const", + "file_size": 473600 + }, + "Attention_3_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 89650368, + "file_name": "cache/NhwcConv_0-conv_inConv_143.const", + "file_size": 473600 + }, + "Attention_3_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 90123968, + "file_name": "cache/NhwcConv_0-conv_inConv_144.const", + "file_size": 473600 + }, + "onnx::MatMul_5748_11_0_12": 
{ + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 90597568, + "file_name": "cache/NhwcConv_0-conv_inConv_145.const", + "file_size": 473600 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 91071168, + "file_name": "cache/NhwcConv_0-conv_inConv_146.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 91072448, + "file_name": "cache/NhwcConv_0-conv_inConv_147.const", + "file_size": 1280 + }, + "onnx::MatMul_5749": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 91073728, + "file_name": "cache/NhwcConv_0-conv_inConv_148.const", + "file_size": 473600 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_35_bfp.out9_9_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 91547328, + "file_name": "cache/NhwcConv_0-conv_inConv_149.const", + "file_size": 128 + }, + "/down_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_15_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 91547456, + "file_name": "cache/NhwcConv_0-conv_inConv_150.const", + "file_size": 128 + }, + "onnx::MatMul_5759_11_0_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, 
+ "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 91547584, + "file_name": "cache/NhwcConv_0-conv_inConv_151.const", + "file_size": 473600 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 92021184, + "file_name": "cache/NhwcConv_0-conv_inConv_152.const", + "file_size": 1280 + }, + "down_blocks.1.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 92022464, + "file_name": "cache/NhwcConv_0-conv_inConv_153.const", + "file_size": 1280 + }, + "onnx::MatMul_5760_11_0_14_12_3_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 92023744, + "file_name": "cache/NhwcConv_0-conv_inConv_154.const", + "file_size": 1868800 + }, + "onnx::MatMul_5760_11_0_14_12_3_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 93892544, + "file_name": "cache/NhwcConv_0-conv_inConv_155.const", + "file_size": 1868800 + }, + "onnx::MatMul_5761_11_0_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "op_tensor_size": 1884160, + "offset": 95761344, + "file_name": "cache/NhwcConv_0-conv_inConv_156.const", + "file_size": 1884160 + }, + "NhwcConv_18_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 97645504, + 
"file_name": "cache/NhwcConv_0-conv_inConv_157.const", + "file_size": 501760 + }, + "NhwcConv_19_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4249600 + ], + "size_in_bytes": 4249600, + "op_tensor_size": 4249600, + "offset": 98147264, + "file_name": "cache/NhwcConv_0-conv_inConv_158.const", + "file_size": 4249600 + }, + "GroupNorm_12_wts_6_0_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 102396864, + "file_name": "cache/NhwcConv_0-conv_inConv_159.const", + "file_size": 2560 + }, + "NhwcConv_20_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 8458240 + ], + "size_in_bytes": 8458240, + "op_tensor_size": 8458240, + "offset": 102399424, + "file_name": "cache/NhwcConv_0-conv_inConv_160.const", + "file_size": 8458240 + }, + "GroupNorm_13_wts_6_0_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 110857664, + "file_name": "cache/NhwcConv_0-conv_inConv_161.const", + "file_size": 5120 + }, + "NhwcConv_21_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 110862784, + "file_name": "cache/NhwcConv_0-conv_inConv_162.const", + "file_size": 16916480 + }, + "NhwcConv_22_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1003520 + ], + "size_in_bytes": 1003520, + "op_tensor_size": 1003520, + "offset": 127779264, + "file_name": "cache/NhwcConv_0-conv_inConv_163.const", + "file_size": 1003520 + }, + "GroupNorm_14_wts_6_2_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + 
"size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 128782784, + "file_name": "cache/NhwcConv_0-conv_inConv_164.const", + "file_size": 5120 + }, + "NhwcConv_23_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 128787904, + "file_name": "cache/NhwcConv_0-conv_inConv_165.const", + "file_size": 2007040 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 130794944, + "file_name": "cache/NhwcConv_0-conv_inConv_166.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 130797504, + "file_name": "cache/NhwcConv_0-conv_inConv_167.const", + "file_size": 2560 + }, + "Attention_4_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 130800064, + "file_name": "cache/NhwcConv_0-conv_inConv_168.const", + "file_size": 1868800 + }, + "Attention_4_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 132668864, + "file_name": "cache/NhwcConv_0-conv_inConv_169.const", + "file_size": 1868800 + }, + "Attention_4_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 134537664, + "file_name": "cache/NhwcConv_0-conv_inConv_170.const", + 
"file_size": 1868800 + }, + "onnx::MatMul_5778_11_0_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 136406464, + "file_name": "cache/NhwcConv_0-conv_inConv_171.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 138275264, + "file_name": "cache/NhwcConv_0-conv_inConv_172.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 138277824, + "file_name": "cache/NhwcConv_0-conv_inConv_173.const", + "file_size": 2560 + }, + "onnx::MatMul_5779": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 138280384, + "file_name": "cache/NhwcConv_0-conv_inConv_174.const", + "file_size": 1868800 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_36_bfp.out9_12_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 140149184, + "file_name": "cache/NhwcConv_0-conv_inConv_175.const", + "file_size": 128 + }, + "/down_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_19_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 140149312, + "file_name": "cache/NhwcConv_0-conv_inConv_176.const", + "file_size": 128 + }, + 
"onnx::MatMul_5789_11_0_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 140149440, + "file_name": "cache/NhwcConv_0-conv_inConv_177.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 142018240, + "file_name": "cache/NhwcConv_0-conv_inConv_178.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 142020800, + "file_name": "cache/NhwcConv_0-conv_inConv_179.const", + "file_size": 2560 + }, + "onnx::MatMul_5790_11_0_18_12_4_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 142023360, + "file_name": "cache/NhwcConv_0-conv_inConv_180.const", + "file_size": 7475200 + }, + "onnx::MatMul_5790_11_0_18_12_4_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 149498560, + "file_name": "cache/NhwcConv_0-conv_inConv_181.const", + "file_size": 7475200 + }, + "onnx::MatMul_5791_11_0_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 156973760, + "file_name": "cache/NhwcConv_0-conv_inConv_182.const", + "file_size": 7475200 + }, + "NhwcConv_24_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 
2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 164448960, + "file_name": "cache/NhwcConv_0-conv_inConv_183.const", + "file_size": 2007040 + }, + "GroupNorm_15_wts_6_0_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 166456000, + "file_name": "cache/NhwcConv_0-conv_inConv_184.const", + "file_size": 5120 + }, + "NhwcConv_25_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 166461120, + "file_name": "cache/NhwcConv_0-conv_inConv_185.const", + "file_size": 16916480 + }, + "GroupNorm_16_wts_6_0_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 183377600, + "file_name": "cache/NhwcConv_0-conv_inConv_186.const", + "file_size": 5120 + }, + "NhwcConv_26_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 183382720, + "file_name": "cache/NhwcConv_0-conv_inConv_187.const", + "file_size": 16916480 + }, + "GroupNorm_17_wts_6_2_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 200299200, + "file_name": "cache/NhwcConv_0-conv_inConv_188.const", + "file_size": 5120 + }, + "NhwcConv_27_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 200304320, + "file_name": "cache/NhwcConv_0-conv_inConv_189.const", + "file_size": 2007040 + }, + 
"down_blocks.2.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 202311360, + "file_name": "cache/NhwcConv_0-conv_inConv_190.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 202313920, + "file_name": "cache/NhwcConv_0-conv_inConv_191.const", + "file_size": 2560 + }, + "Attention_5_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 202316480, + "file_name": "cache/NhwcConv_0-conv_inConv_192.const", + "file_size": 1868800 + }, + "Attention_5_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 204185280, + "file_name": "cache/NhwcConv_0-conv_inConv_193.const", + "file_size": 1868800 + }, + "Attention_5_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 206054080, + "file_name": "cache/NhwcConv_0-conv_inConv_194.const", + "file_size": 1868800 + }, + "onnx::MatMul_5808_11_0_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 207922880, + "file_name": "cache/NhwcConv_0-conv_inConv_195.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": 
"bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 209791680, + "file_name": "cache/NhwcConv_0-conv_inConv_196.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 209794240, + "file_name": "cache/NhwcConv_0-conv_inConv_197.const", + "file_size": 2560 + }, + "onnx::MatMul_5809": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 209796800, + "file_name": "cache/NhwcConv_0-conv_inConv_198.const", + "file_size": 1868800 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_37_bfp.out9_15_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 211665600, + "file_name": "cache/NhwcConv_0-conv_inConv_199.const", + "file_size": 128 + }, + "/down_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_23_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 211665728, + "file_name": "cache/NhwcConv_0-conv_inConv_200.const", + "file_size": 128 + }, + "onnx::MatMul_5819_11_0_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 211665856, + "file_name": "cache/NhwcConv_0-conv_inConv_201.const", + "file_size": 1868800 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], 
+ "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 213534656, + "file_name": "cache/NhwcConv_0-conv_inConv_202.const", + "file_size": 2560 + }, + "down_blocks.2.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 213537216, + "file_name": "cache/NhwcConv_0-conv_inConv_203.const", + "file_size": 2560 + }, + "onnx::MatMul_5820_11_0_22_12_5_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 213539776, + "file_name": "cache/NhwcConv_0-conv_inConv_204.const", + "file_size": 7475200 + }, + "onnx::MatMul_5820_11_0_22_12_5_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 221014976, + "file_name": "cache/NhwcConv_0-conv_inConv_205.const", + "file_size": 7475200 + }, + "onnx::MatMul_5821_11_0_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 228490176, + "file_name": "cache/NhwcConv_0-conv_inConv_206.const", + "file_size": 7475200 + }, + "NhwcConv_28_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 235965376, + "file_name": "cache/NhwcConv_0-conv_inConv_207.const", + "file_size": 2007040 + }, + "NhwcConv_29_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "op_tensor_size": 17244160, + "offset": 237972416, + "file_name": "cache/NhwcConv_0-conv_inConv_208.const", + "file_size": 
17244160 + }, + "GroupNorm_18_wts_6_0_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 255216576, + "file_name": "cache/NhwcConv_0-conv_inConv_209.const", + "file_size": 5120 + }, + "NhwcConv_30_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 255221696, + "file_name": "cache/NhwcConv_0-conv_inConv_210.const", + "file_size": 16916480 + }, + "GroupNorm_19_wts_6_0_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 272138176, + "file_name": "cache/NhwcConv_0-conv_inConv_211.const", + "file_size": 5120 + }, + "NhwcConv_31_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 272143296, + "file_name": "cache/NhwcConv_0-conv_inConv_212.const", + "file_size": 16916480 + }, + "GroupNorm_20_wts_6_0_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 289059776, + "file_name": "cache/NhwcConv_0-conv_inConv_213.const", + "file_size": 5120 + }, + "NhwcConv_32_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 289064896, + "file_name": "cache/NhwcConv_0-conv_inConv_214.const", + "file_size": 16916480 + }, + "GroupNorm_21_wts_6_0_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 305981376, 
+ "file_name": "cache/NhwcConv_0-conv_inConv_215.const", + "file_size": 5120 + }, + "NhwcConv_33_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 305986496, + "file_name": "cache/NhwcConv_0-conv_inConv_216.const", + "file_size": 16916480 + }, + "GroupNorm_22_wts_6_0_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 322902976, + "file_name": "cache/NhwcConv_0-conv_inConv_217.const", + "file_size": 5120 + }, + "NhwcConv_34_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 322908096, + "file_name": "cache/NhwcConv_0-conv_inConv_218.const", + "file_size": 16916480 + }, + "GroupNorm_23_wts_6_0_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 339824576, + "file_name": "cache/NhwcConv_0-conv_inConv_219.const", + "file_size": 5120 + }, + "NhwcConv_35_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 339829696, + "file_name": "cache/NhwcConv_0-conv_inConv_220.const", + "file_size": 16916480 + }, + "GroupNorm_24_wts_6_2_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 356746176, + "file_name": "cache/NhwcConv_0-conv_inConv_221.const", + "file_size": 5120 + }, + "NhwcConv_36_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + 
"size_in_bytes": 2048000, + "op_tensor_size": 2048000, + "offset": 356751296, + "file_name": "cache/NhwcConv_0-conv_inConv_222.const", + "file_size": 2048000 + }, + "mid_block.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 358799296, + "file_name": "cache/NhwcConv_0-conv_inConv_223.const", + "file_size": 2560 + }, + "mid_block.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 358801856, + "file_name": "cache/NhwcConv_0-conv_inConv_224.const", + "file_size": 2560 + }, + "Attention_6_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 358804416, + "file_name": "cache/NhwcConv_0-conv_inConv_225.const", + "file_size": 1868800 + }, + "Attention_6_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 360673216, + "file_name": "cache/NhwcConv_0-conv_inConv_226.const", + "file_size": 1868800 + }, + "Attention_6_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 362542016, + "file_name": "cache/NhwcConv_0-conv_inConv_227.const", + "file_size": 1868800 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_key.out2_4_18_bfp.out9_121_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + 
"offset": 364410816, + "file_name": "cache/NhwcConv_0-conv_inConv_228.const", + "file_size": 128 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_query.out2_4_19_bfp.out9_120_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 364410944, + "file_name": "cache/NhwcConv_0-conv_inConv_229.const", + "file_size": 128 + }, + "/mid_block/attentions.0/transformer_blocks.0/norm1/LayerNormalization_output_0_bias_value.out2_4_20_bfp.out9_122_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 364411072, + "file_name": "cache/NhwcConv_0-conv_inConv_230.const", + "file_size": 128 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn1/Reshape_3_output_0.out2_3_26_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 364411200, + "file_name": "cache/NhwcConv_0-conv_inConv_231.const", + "file_size": 128 + }, + "onnx::MatMul_5846_11_0_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "op_tensor_size": 1894400, + "offset": 364411328, + "file_name": "cache/NhwcConv_0-conv_inConv_232.const", + "file_size": 1894400 + }, + "mid_block.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 366305728, + "file_name": "cache/NhwcConv_0-conv_inConv_233.const", + "file_size": 2560 + }, + "mid_block.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + 
"size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 366308288, + "file_name": "cache/NhwcConv_0-conv_inConv_234.const", + "file_size": 2560 + }, + "onnx::MatMul_5847": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 366310848, + "file_name": "cache/NhwcConv_0-conv_inConv_235.const", + "file_size": 1868800 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_38_bfp.out9_18_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 368179648, + "file_name": "cache/NhwcConv_0-conv_inConv_236.const", + "file_size": 128 + }, + "/mid_block/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_27_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 368179776, + "file_name": "cache/NhwcConv_0-conv_inConv_237.const", + "file_size": 128 + }, + "onnx::MatMul_5857_11_0_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1894400 + ], + "size_in_bytes": 1894400, + "op_tensor_size": 1894400, + "offset": 368179904, + "file_name": "cache/NhwcConv_0-conv_inConv_238.const", + "file_size": 1894400 + }, + "mid_block.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 370074304, + "file_name": "cache/NhwcConv_0-conv_inConv_239.const", + "file_size": 2560 + }, + "mid_block.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + 
"offset": 370076864, + "file_name": "cache/NhwcConv_0-conv_inConv_240.const", + "file_size": 2560 + }, + "onnx::MatMul_5858_11_0_26_12_6_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 370079424, + "file_name": "cache/NhwcConv_0-conv_inConv_241.const", + "file_size": 7475200 + }, + "onnx::MatMul_5858_11_0_26_12_6_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 377554624, + "file_name": "cache/NhwcConv_0-conv_inConv_242.const", + "file_size": 7475200 + }, + "onnx::MatMul_5859_11_0_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 385029824, + "file_name": "cache/NhwcConv_0-conv_inConv_243.const", + "file_size": 7475200 + }, + "NhwcConv_37_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2048000 + ], + "size_in_bytes": 2048000, + "op_tensor_size": 2048000, + "offset": 392505024, + "file_name": "cache/NhwcConv_0-conv_inConv_244.const", + "file_size": 2048000 + }, + "GroupNorm_25_wts_6_0_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 394553024, + "file_name": "cache/NhwcConv_0-conv_inConv_245.const", + "file_size": 5120 + }, + "NhwcConv_38_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 394558144, + "file_name": "cache/NhwcConv_0-conv_inConv_246.const", + "file_size": 16916480 + }, + "GroupNorm_26_wts_6_0_19": { + "packed_buffer_label": "const", + 
"xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 411474624, + "file_name": "cache/NhwcConv_0-conv_inConv_247.const", + "file_size": 5120 + }, + "NhwcConv_39_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 411479744, + "file_name": "cache/NhwcConv_0-conv_inConv_248.const", + "file_size": 16916480 + }, + "GroupNorm_27_wts_6_0_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "op_tensor_size": 10240, + "offset": 428396224, + "file_name": "cache/NhwcConv_0-conv_inConv_249.const", + "file_size": 10240 + }, + "NhwcConv_40_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 33832960 + ], + "size_in_bytes": 33832960, + "op_tensor_size": 33832960, + "offset": 428406464, + "file_name": "cache/NhwcConv_0-conv_inConv_250.const", + "file_size": 33832960 + }, + "GroupNorm_28_wts_6_0_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 462239424, + "file_name": "cache/NhwcConv_0-conv_inConv_251.const", + "file_size": 5120 + }, + "NhwcConv_41_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 462244544, + "file_name": "cache/NhwcConv_0-conv_inConv_252.const", + "file_size": 16916480 + }, + "NhwcConv_42_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "op_tensor_size": 4096000, + "offset": 479161024, + "file_name": "cache/NhwcConv_0-conv_inConv_253.const", + 
"file_size": 4096000 + }, + "GroupNorm_29_wts_6_0_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "op_tensor_size": 10240, + "offset": 483257024, + "file_name": "cache/NhwcConv_0-conv_inConv_254.const", + "file_size": 10240 + }, + "NhwcConv_43_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 33832960 + ], + "size_in_bytes": 33832960, + "op_tensor_size": 33832960, + "offset": 483267264, + "file_name": "cache/NhwcConv_0-conv_inConv_255.const", + "file_size": 33832960 + }, + "GroupNorm_30_wts_6_0_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 517100224, + "file_name": "cache/NhwcConv_0-conv_inConv_256.const", + "file_size": 5120 + }, + "NhwcConv_44_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 517105344, + "file_name": "cache/NhwcConv_0-conv_inConv_257.const", + "file_size": 16916480 + }, + "NhwcConv_45_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "op_tensor_size": 4096000, + "offset": 534021824, + "file_name": "cache/NhwcConv_0-conv_inConv_258.const", + "file_size": 4096000 + }, + "GroupNorm_31_wts_6_0_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "op_tensor_size": 10240, + "offset": 538117824, + "file_name": "cache/NhwcConv_0-conv_inConv_259.const", + "file_size": 10240 + }, + "NhwcConv_46_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 33832960 + ], + "size_in_bytes": 33832960, + "op_tensor_size": 
33832960, + "offset": 538128064, + "file_name": "cache/NhwcConv_0-conv_inConv_260.const", + "file_size": 33832960 + }, + "GroupNorm_32_wts_6_0_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 571961024, + "file_name": "cache/NhwcConv_0-conv_inConv_261.const", + "file_size": 5120 + }, + "NhwcConv_47_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 571966144, + "file_name": "cache/NhwcConv_0-conv_inConv_262.const", + "file_size": 16916480 + }, + "NhwcConv_48_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4096000 + ], + "size_in_bytes": 4096000, + "op_tensor_size": 4096000, + "offset": 588882624, + "file_name": "cache/NhwcConv_0-conv_inConv_263.const", + "file_size": 4096000 + }, + "/up_blocks.0/upsamplers.0/Resize.weights3_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "op_tensor_size": 256, + "offset": 592978624, + "file_name": "cache/NhwcConv_0-conv_inConv_264.const", + "file_size": 256 + }, + "NhwcConv_49_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 592978880, + "file_name": "cache/NhwcConv_0-conv_inConv_265.const", + "file_size": 16916480 + }, + "GroupNorm_33_wts_6_0_26": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "op_tensor_size": 10240, + "offset": 609895360, + "file_name": "cache/NhwcConv_0-conv_inConv_266.const", + "file_size": 10240 + }, + "NhwcConv_50_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + 
"dtype": "bfp16ebs8", + "shape": [ + 33832960 + ], + "size_in_bytes": 33832960, + "op_tensor_size": 33832960, + "offset": 609905600, + "file_name": "cache/NhwcConv_0-conv_inConv_267.const", + "file_size": 33832960 + }, + "GroupNorm_34_wts_6_0_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 643738560, + "file_name": "cache/NhwcConv_0-conv_inConv_268.const", + "file_size": 5120 + }, + "NhwcConv_51_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 643743680, + "file_name": "cache/NhwcConv_0-conv_inConv_269.const", + "file_size": 16916480 + }, + "NhwcConv_52_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4014080 + ], + "size_in_bytes": 4014080, + "op_tensor_size": 4014080, + "offset": 660660160, + "file_name": "cache/NhwcConv_0-conv_inConv_270.const", + "file_size": 4014080 + }, + "GroupNorm_35_wts_6_2_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 664674240, + "file_name": "cache/NhwcConv_0-conv_inConv_271.const", + "file_size": 5120 + }, + "NhwcConv_53_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 664679360, + "file_name": "cache/NhwcConv_0-conv_inConv_272.const", + "file_size": 2007040 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 666686400, + "file_name": "cache/NhwcConv_0-conv_inConv_273.const", 
+ "file_size": 2560 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 666688960, + "file_name": "cache/NhwcConv_0-conv_inConv_274.const", + "file_size": 2560 + }, + "Attention_7_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 666691520, + "file_name": "cache/NhwcConv_0-conv_inConv_275.const", + "file_size": 1868800 + }, + "Attention_7_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 668560320, + "file_name": "cache/NhwcConv_0-conv_inConv_276.const", + "file_size": 1868800 + }, + "Attention_7_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 670429120, + "file_name": "cache/NhwcConv_0-conv_inConv_277.const", + "file_size": 1868800 + }, + "onnx::MatMul_5893_11_0_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 672297920, + "file_name": "cache/NhwcConv_0-conv_inConv_278.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 674166720, + "file_name": "cache/NhwcConv_0-conv_inConv_279.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + 
"xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 674169280, + "file_name": "cache/NhwcConv_0-conv_inConv_280.const", + "file_size": 2560 + }, + "onnx::MatMul_5894": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 674171840, + "file_name": "cache/NhwcConv_0-conv_inConv_281.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_39_bfp.out9_21_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 676040640, + "file_name": "cache/NhwcConv_0-conv_inConv_282.const", + "file_size": 128 + }, + "/up_blocks.1/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_31_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 676040768, + "file_name": "cache/NhwcConv_0-conv_inConv_283.const", + "file_size": 128 + }, + "onnx::MatMul_5904_11_0_29": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 676040896, + "file_name": "cache/NhwcConv_0-conv_inConv_284.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 677909696, + "file_name": "cache/NhwcConv_0-conv_inConv_285.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + 
"shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 677912256, + "file_name": "cache/NhwcConv_0-conv_inConv_286.const", + "file_size": 2560 + }, + "onnx::MatMul_5905_11_0_30_12_7_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 677914816, + "file_name": "cache/NhwcConv_0-conv_inConv_287.const", + "file_size": 7475200 + }, + "onnx::MatMul_5905_11_0_30_12_7_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 685390016, + "file_name": "cache/NhwcConv_0-conv_inConv_288.const", + "file_size": 7475200 + }, + "onnx::MatMul_5906_11_0_31": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 692865216, + "file_name": "cache/NhwcConv_0-conv_inConv_289.const", + "file_size": 7475200 + }, + "NhwcConv_54_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 700340416, + "file_name": "cache/NhwcConv_0-conv_inConv_290.const", + "file_size": 2007040 + }, + "GroupNorm_36_wts_6_0_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 5120 + ], + "size_in_bytes": 10240, + "op_tensor_size": 10240, + "offset": 702347456, + "file_name": "cache/NhwcConv_0-conv_inConv_291.const", + "file_size": 10240 + }, + "NhwcConv_55_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 33832960 + ], + "size_in_bytes": 33832960, + "op_tensor_size": 33832960, + "offset": 702357696, + "file_name": "cache/NhwcConv_0-conv_inConv_292.const", + "file_size": 33832960 + }, 
+ "GroupNorm_37_wts_6_0_29": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 736190656, + "file_name": "cache/NhwcConv_0-conv_inConv_293.const", + "file_size": 5120 + }, + "NhwcConv_56_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 736195776, + "file_name": "cache/NhwcConv_0-conv_inConv_294.const", + "file_size": 16916480 + }, + "NhwcConv_57_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4014080 + ], + "size_in_bytes": 4014080, + "op_tensor_size": 4014080, + "offset": 753112256, + "file_name": "cache/NhwcConv_0-conv_inConv_295.const", + "file_size": 4014080 + }, + "GroupNorm_38_wts_6_2_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 757126336, + "file_name": "cache/NhwcConv_0-conv_inConv_296.const", + "file_size": 5120 + }, + "NhwcConv_58_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 757131456, + "file_name": "cache/NhwcConv_0-conv_inConv_297.const", + "file_size": 2007040 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 759138496, + "file_name": "cache/NhwcConv_0-conv_inConv_298.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + 
"op_tensor_size": 2560, + "offset": 759141056, + "file_name": "cache/NhwcConv_0-conv_inConv_299.const", + "file_size": 2560 + }, + "Attention_8_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 759143616, + "file_name": "cache/NhwcConv_0-conv_inConv_300.const", + "file_size": 1868800 + }, + "Attention_8_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 761012416, + "file_name": "cache/NhwcConv_0-conv_inConv_301.const", + "file_size": 1868800 + }, + "Attention_8_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 762881216, + "file_name": "cache/NhwcConv_0-conv_inConv_302.const", + "file_size": 1868800 + }, + "onnx::MatMul_5923_11_0_32": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 764750016, + "file_name": "cache/NhwcConv_0-conv_inConv_303.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 766618816, + "file_name": "cache/NhwcConv_0-conv_inConv_304.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 766621376, + "file_name": "cache/NhwcConv_0-conv_inConv_305.const", + "file_size": 2560 + }, + 
"onnx::MatMul_5924": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 766623936, + "file_name": "cache/NhwcConv_0-conv_inConv_306.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_40_bfp.out9_24_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 768492736, + "file_name": "cache/NhwcConv_0-conv_inConv_307.const", + "file_size": 128 + }, + "/up_blocks.1/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_35_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 768492864, + "file_name": "cache/NhwcConv_0-conv_inConv_308.const", + "file_size": 128 + }, + "onnx::MatMul_5934_11_0_33": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 768492992, + "file_name": "cache/NhwcConv_0-conv_inConv_309.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 770361792, + "file_name": "cache/NhwcConv_0-conv_inConv_310.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 770364352, + "file_name": "cache/NhwcConv_0-conv_inConv_311.const", + "file_size": 2560 + }, + "onnx::MatMul_5935_11_0_34_12_8_0": { + 
"packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 770366912, + "file_name": "cache/NhwcConv_0-conv_inConv_312.const", + "file_size": 7475200 + }, + "onnx::MatMul_5935_11_0_34_12_8_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 777842112, + "file_name": "cache/NhwcConv_0-conv_inConv_313.const", + "file_size": 7475200 + }, + "onnx::MatMul_5936_11_0_35": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 785317312, + "file_name": "cache/NhwcConv_0-conv_inConv_314.const", + "file_size": 7475200 + }, + "NhwcConv_59_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 792792512, + "file_name": "cache/NhwcConv_0-conv_inConv_315.const", + "file_size": 2007040 + }, + "GroupNorm_39_wts_6_0_30": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 3840 + ], + "size_in_bytes": 7680, + "op_tensor_size": 7680, + "offset": 794799552, + "file_name": "cache/NhwcConv_0-conv_inConv_316.const", + "file_size": 7680 + }, + "NhwcConv_60_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 25374720 + ], + "size_in_bytes": 25374720, + "op_tensor_size": 25374720, + "offset": 794807232, + "file_name": "cache/NhwcConv_0-conv_inConv_317.const", + "file_size": 25374720 + }, + "GroupNorm_40_wts_6_0_31": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 820181952, + "file_name": 
"cache/NhwcConv_0-conv_inConv_318.const", + "file_size": 5120 + }, + "NhwcConv_61_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 16916480 + ], + "size_in_bytes": 16916480, + "op_tensor_size": 16916480, + "offset": 820187072, + "file_name": "cache/NhwcConv_0-conv_inConv_319.const", + "file_size": 16916480 + }, + "NhwcConv_62_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 3010560 + ], + "size_in_bytes": 3010560, + "op_tensor_size": 3010560, + "offset": 837103552, + "file_name": "cache/NhwcConv_0-conv_inConv_320.const", + "file_size": 3010560 + }, + "GroupNorm_41_wts_6_2_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 840114112, + "file_name": "cache/NhwcConv_0-conv_inConv_321.const", + "file_size": 5120 + }, + "NhwcConv_63_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 840119232, + "file_name": "cache/NhwcConv_0-conv_inConv_322.const", + "file_size": 2007040 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 842126272, + "file_name": "cache/NhwcConv_0-conv_inConv_323.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 842128832, + "file_name": "cache/NhwcConv_0-conv_inConv_324.const", + "file_size": 2560 + }, + "Attention_9_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + 
"dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 842131392, + "file_name": "cache/NhwcConv_0-conv_inConv_325.const", + "file_size": 1868800 + }, + "Attention_9_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 844000192, + "file_name": "cache/NhwcConv_0-conv_inConv_326.const", + "file_size": 1868800 + }, + "Attention_9_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 845868992, + "file_name": "cache/NhwcConv_0-conv_inConv_327.const", + "file_size": 1868800 + }, + "onnx::MatMul_5953_11_0_36": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 847737792, + "file_name": "cache/NhwcConv_0-conv_inConv_328.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 849606592, + "file_name": "cache/NhwcConv_0-conv_inConv_329.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 849609152, + "file_name": "cache/NhwcConv_0-conv_inConv_330.const", + "file_size": 2560 + }, + "onnx::MatMul_5954": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 849611712, + "file_name": 
"cache/NhwcConv_0-conv_inConv_331.const", + "file_size": 1868800 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_41_bfp.out9_27_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 851480512, + "file_name": "cache/NhwcConv_0-conv_inConv_332.const", + "file_size": 128 + }, + "/up_blocks.1/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_39_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 851480640, + "file_name": "cache/NhwcConv_0-conv_inConv_333.const", + "file_size": 128 + }, + "onnx::MatMul_5964_11_0_37": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 851480768, + "file_name": "cache/NhwcConv_0-conv_inConv_334.const", + "file_size": 1868800 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 853349568, + "file_name": "cache/NhwcConv_0-conv_inConv_335.const", + "file_size": 2560 + }, + "up_blocks.1.attentions.2.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 853352128, + "file_name": "cache/NhwcConv_0-conv_inConv_336.const", + "file_size": 2560 + }, + "onnx::MatMul_5965_11_0_38_12_9_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 853354688, + "file_name": 
"cache/NhwcConv_0-conv_inConv_337.const", + "file_size": 7475200 + }, + "onnx::MatMul_5965_11_0_38_12_9_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 860829888, + "file_name": "cache/NhwcConv_0-conv_inConv_338.const", + "file_size": 7475200 + }, + "onnx::MatMul_5966_11_0_39": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 7475200 + ], + "size_in_bytes": 7475200, + "op_tensor_size": 7475200, + "offset": 868305088, + "file_name": "cache/NhwcConv_0-conv_inConv_339.const", + "file_size": 7475200 + }, + "NhwcConv_64_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2007040 + ], + "size_in_bytes": 2007040, + "op_tensor_size": 2007040, + "offset": 875780288, + "file_name": "cache/NhwcConv_0-conv_inConv_340.const", + "file_size": 2007040 + }, + "/up_blocks.1/upsamplers.0/Resize.weights3_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "op_tensor_size": 256, + "offset": 877787328, + "file_name": "cache/NhwcConv_0-conv_inConv_341.const", + "file_size": 256 + }, + "NhwcConv_65_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 17244160 + ], + "size_in_bytes": 17244160, + "op_tensor_size": 17244160, + "offset": 877787584, + "file_name": "cache/NhwcConv_0-conv_inConv_342.const", + "file_size": 17244160 + }, + "GroupNorm_42_wts_6_0_32": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 3840 + ], + "size_in_bytes": 7680, + "op_tensor_size": 7680, + "offset": 895031744, + "file_name": "cache/NhwcConv_0-conv_inConv_343.const", + "file_size": 7680 + }, + "NhwcConv_66_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": 
[ + 12851200 + ], + "size_in_bytes": 12851200, + "op_tensor_size": 12851200, + "offset": 895039424, + "file_name": "cache/NhwcConv_0-conv_inConv_344.const", + "file_size": 12851200 + }, + "GroupNorm_43_wts_6_0_33": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 907890624, + "file_name": "cache/NhwcConv_0-conv_inConv_345.const", + "file_size": 2560 + }, + "NhwcConv_67_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 4311040, + "offset": 907893184, + "file_name": "cache/NhwcConv_0-conv_inConv_346.const", + "file_size": 4311040 + }, + "NhwcConv_68_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1505280 + ], + "size_in_bytes": 1505280, + "op_tensor_size": 1505280, + "offset": 912204224, + "file_name": "cache/NhwcConv_0-conv_inConv_347.const", + "file_size": 1505280 + }, + "GroupNorm_44_wts_6_2_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 913709504, + "file_name": "cache/NhwcConv_0-conv_inConv_348.const", + "file_size": 2560 + }, + "NhwcConv_69_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 913712064, + "file_name": "cache/NhwcConv_0-conv_inConv_349.const", + "file_size": 501760 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 914213824, + "file_name": "cache/NhwcConv_0-conv_inConv_350.const", + "file_size": 1280 + }, + 
"up_blocks.2.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 914215104, + "file_name": "cache/NhwcConv_0-conv_inConv_351.const", + "file_size": 1280 + }, + "Attention_10_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 914216384, + "file_name": "cache/NhwcConv_0-conv_inConv_352.const", + "file_size": 473600 + }, + "Attention_10_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 914689984, + "file_name": "cache/NhwcConv_0-conv_inConv_353.const", + "file_size": 473600 + }, + "Attention_10_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 915163584, + "file_name": "cache/NhwcConv_0-conv_inConv_354.const", + "file_size": 473600 + }, + "onnx::MatMul_5984_11_0_40": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 915637184, + "file_name": "cache/NhwcConv_0-conv_inConv_355.const", + "file_size": 473600 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 916110784, + "file_name": "cache/NhwcConv_0-conv_inConv_356.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ 
+ 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 916112064, + "file_name": "cache/NhwcConv_0-conv_inConv_357.const", + "file_size": 1280 + }, + "onnx::MatMul_5985": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 916113344, + "file_name": "cache/NhwcConv_0-conv_inConv_358.const", + "file_size": 473600 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_42_bfp.out9_30_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 916586944, + "file_name": "cache/NhwcConv_0-conv_inConv_359.const", + "file_size": 128 + }, + "/up_blocks.2/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_43_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 916587072, + "file_name": "cache/NhwcConv_0-conv_inConv_360.const", + "file_size": 128 + }, + "onnx::MatMul_5995_11_0_41": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 916587200, + "file_name": "cache/NhwcConv_0-conv_inConv_361.const", + "file_size": 473600 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 917060800, + "file_name": "cache/NhwcConv_0-conv_inConv_362.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 
1280, + "offset": 917062080, + "file_name": "cache/NhwcConv_0-conv_inConv_363.const", + "file_size": 1280 + }, + "onnx::MatMul_5996_11_0_42_12_10_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 917063360, + "file_name": "cache/NhwcConv_0-conv_inConv_364.const", + "file_size": 1868800 + }, + "onnx::MatMul_5996_11_0_42_12_10_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 918932160, + "file_name": "cache/NhwcConv_0-conv_inConv_365.const", + "file_size": 1868800 + }, + "onnx::MatMul_5997_11_0_43": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "op_tensor_size": 1884160, + "offset": 920800960, + "file_name": "cache/NhwcConv_0-conv_inConv_366.const", + "file_size": 1884160 + }, + "NhwcConv_70_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 922685120, + "file_name": "cache/NhwcConv_0-conv_inConv_367.const", + "file_size": 501760 + }, + "GroupNorm_45_wts_6_0_34": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 2560 + ], + "size_in_bytes": 5120, + "op_tensor_size": 5120, + "offset": 923186880, + "file_name": "cache/NhwcConv_0-conv_inConv_368.const", + "file_size": 5120 + }, + "NhwcConv_71_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 8622080 + ], + "size_in_bytes": 8622080, + "op_tensor_size": 8622080, + "offset": 923192000, + "file_name": "cache/NhwcConv_0-conv_inConv_369.const", + "file_size": 8622080 + }, + "GroupNorm_46_wts_6_0_35": { + "packed_buffer_label": "const", + 
"xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 931814080, + "file_name": "cache/NhwcConv_0-conv_inConv_370.const", + "file_size": 2560 + }, + "NhwcConv_72_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 4311040, + "offset": 931816640, + "file_name": "cache/NhwcConv_0-conv_inConv_371.const", + "file_size": 4311040 + }, + "NhwcConv_73_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1003520 + ], + "size_in_bytes": 1003520, + "op_tensor_size": 1003520, + "offset": 936127680, + "file_name": "cache/NhwcConv_0-conv_inConv_372.const", + "file_size": 1003520 + }, + "GroupNorm_47_wts_6_2_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 937131200, + "file_name": "cache/NhwcConv_0-conv_inConv_373.const", + "file_size": 2560 + }, + "NhwcConv_74_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 937133760, + "file_name": "cache/NhwcConv_0-conv_inConv_374.const", + "file_size": 501760 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 937635520, + "file_name": "cache/NhwcConv_0-conv_inConv_375.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 937636800, + "file_name": 
"cache/NhwcConv_0-conv_inConv_376.const", + "file_size": 1280 + }, + "Attention_11_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 937638080, + "file_name": "cache/NhwcConv_0-conv_inConv_377.const", + "file_size": 473600 + }, + "Attention_11_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 938111680, + "file_name": "cache/NhwcConv_0-conv_inConv_378.const", + "file_size": 473600 + }, + "Attention_11_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 938585280, + "file_name": "cache/NhwcConv_0-conv_inConv_379.const", + "file_size": 473600 + }, + "onnx::MatMul_6014_11_0_44": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 939058880, + "file_name": "cache/NhwcConv_0-conv_inConv_380.const", + "file_size": 473600 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 939532480, + "file_name": "cache/NhwcConv_0-conv_inConv_381.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 939533760, + "file_name": "cache/NhwcConv_0-conv_inConv_382.const", + "file_size": 1280 + }, + "onnx::MatMul_6015": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + 
"dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 939535040, + "file_name": "cache/NhwcConv_0-conv_inConv_383.const", + "file_size": 473600 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_43_bfp.out9_33_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 940008640, + "file_name": "cache/NhwcConv_0-conv_inConv_384.const", + "file_size": 128 + }, + "/up_blocks.2/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_47_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 940008768, + "file_name": "cache/NhwcConv_0-conv_inConv_385.const", + "file_size": 128 + }, + "onnx::MatMul_6025_11_0_45": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 940008896, + "file_name": "cache/NhwcConv_0-conv_inConv_386.const", + "file_size": 473600 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 940482496, + "file_name": "cache/NhwcConv_0-conv_inConv_387.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 940483776, + "file_name": "cache/NhwcConv_0-conv_inConv_388.const", + "file_size": 1280 + }, + "onnx::MatMul_6026_11_0_46_12_11_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 
1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 940485056, + "file_name": "cache/NhwcConv_0-conv_inConv_389.const", + "file_size": 1868800 + }, + "onnx::MatMul_6026_11_0_46_12_11_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 942353856, + "file_name": "cache/NhwcConv_0-conv_inConv_390.const", + "file_size": 1868800 + }, + "onnx::MatMul_6027_11_0_47": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "op_tensor_size": 1884160, + "offset": 944222656, + "file_name": "cache/NhwcConv_0-conv_inConv_391.const", + "file_size": 1884160 + }, + "NhwcConv_75_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 946106816, + "file_name": "cache/NhwcConv_0-conv_inConv_392.const", + "file_size": 501760 + }, + "GroupNorm_48_wts_6_0_36": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1920 + ], + "size_in_bytes": 3840, + "op_tensor_size": 3840, + "offset": 946608576, + "file_name": "cache/NhwcConv_0-conv_inConv_393.const", + "file_size": 3840 + }, + "NhwcConv_76_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 6425600 + ], + "size_in_bytes": 6425600, + "op_tensor_size": 6425600, + "offset": 946612416, + "file_name": "cache/NhwcConv_0-conv_inConv_394.const", + "file_size": 6425600 + }, + "GroupNorm_49_wts_6_0_37": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 953038016, + "file_name": "cache/NhwcConv_0-conv_inConv_395.const", + "file_size": 2560 + }, + "NhwcConv_77_weight_NHWC": { + 
"packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 4311040, + "offset": 953040576, + "file_name": "cache/NhwcConv_0-conv_inConv_396.const", + "file_size": 4311040 + }, + "NhwcConv_78_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 752640 + ], + "size_in_bytes": 752640, + "op_tensor_size": 752640, + "offset": 957351616, + "file_name": "cache/NhwcConv_0-conv_inConv_397.const", + "file_size": 752640 + }, + "GroupNorm_50_wts_6_2_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 958104256, + "file_name": "cache/NhwcConv_0-conv_inConv_398.const", + "file_size": 2560 + }, + "NhwcConv_79_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 958106816, + "file_name": "cache/NhwcConv_0-conv_inConv_399.const", + "file_size": 501760 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 958608576, + "file_name": "cache/NhwcConv_0-conv_inConv_400.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 958609856, + "file_name": "cache/NhwcConv_0-conv_inConv_401.const", + "file_size": 1280 + }, + "Attention_12_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 
958611136, + "file_name": "cache/NhwcConv_0-conv_inConv_402.const", + "file_size": 473600 + }, + "Attention_12_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 959084736, + "file_name": "cache/NhwcConv_0-conv_inConv_403.const", + "file_size": 473600 + }, + "Attention_12_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 959558336, + "file_name": "cache/NhwcConv_0-conv_inConv_404.const", + "file_size": 473600 + }, + "onnx::MatMul_6044_11_0_48": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 960031936, + "file_name": "cache/NhwcConv_0-conv_inConv_405.const", + "file_size": 473600 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 960505536, + "file_name": "cache/NhwcConv_0-conv_inConv_406.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 960506816, + "file_name": "cache/NhwcConv_0-conv_inConv_407.const", + "file_size": 1280 + }, + "onnx::MatMul_6045": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 960508096, + "file_name": "cache/NhwcConv_0-conv_inConv_408.const", + "file_size": 473600 + }, + 
"/up_blocks.2/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_44_bfp.out9_36_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 960981696, + "file_name": "cache/NhwcConv_0-conv_inConv_409.const", + "file_size": 128 + }, + "/up_blocks.2/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_51_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 960981824, + "file_name": "cache/NhwcConv_0-conv_inConv_410.const", + "file_size": 128 + }, + "onnx::MatMul_6055_11_0_49": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 473600 + ], + "size_in_bytes": 473600, + "op_tensor_size": 473600, + "offset": 960981952, + "file_name": "cache/NhwcConv_0-conv_inConv_411.const", + "file_size": 473600 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 961455552, + "file_name": "cache/NhwcConv_0-conv_inConv_412.const", + "file_size": 1280 + }, + "up_blocks.2.attentions.2.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 961456832, + "file_name": "cache/NhwcConv_0-conv_inConv_413.const", + "file_size": 1280 + }, + "onnx::MatMul_6056_11_0_50_12_12_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 961458112, + "file_name": "cache/NhwcConv_0-conv_inConv_414.const", + "file_size": 1868800 + }, + 
"onnx::MatMul_6056_11_0_50_12_12_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1868800 + ], + "size_in_bytes": 1868800, + "op_tensor_size": 1868800, + "offset": 963326912, + "file_name": "cache/NhwcConv_0-conv_inConv_415.const", + "file_size": 1868800 + }, + "onnx::MatMul_6057_11_0_51": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1884160 + ], + "size_in_bytes": 1884160, + "op_tensor_size": 1884160, + "offset": 965195712, + "file_name": "cache/NhwcConv_0-conv_inConv_416.const", + "file_size": 1884160 + }, + "NhwcConv_80_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 501760 + ], + "size_in_bytes": 501760, + "op_tensor_size": 501760, + "offset": 967079872, + "file_name": "cache/NhwcConv_0-conv_inConv_417.const", + "file_size": 501760 + }, + "/up_blocks.2/upsamplers.0/Resize.weights3_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "op_tensor_size": 256, + "offset": 967581632, + "file_name": "cache/NhwcConv_0-conv_inConv_418.const", + "file_size": 256 + }, + "NhwcConv_81_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 4311040 + ], + "size_in_bytes": 4311040, + "op_tensor_size": 4311040, + "offset": 967581888, + "file_name": "cache/NhwcConv_0-conv_inConv_419.const", + "file_size": 4311040 + }, + "GroupNorm_51_wts_6_0_38": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1920 + ], + "size_in_bytes": 3840, + "op_tensor_size": 3840, + "offset": 971892928, + "file_name": "cache/NhwcConv_0-conv_inConv_420.const", + "file_size": 3840 + }, + "NhwcConv_82_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 3212800 + ], + "size_in_bytes": 3212800, + "op_tensor_size": 3212800, + 
"offset": 971896768, + "file_name": "cache/NhwcConv_0-conv_inConv_421.const", + "file_size": 3212800 + }, + "GroupNorm_52_wts_6_0_39": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 975109568, + "file_name": "cache/NhwcConv_0-conv_inConv_422.const", + "file_size": 1280 + }, + "NhwcConv_83_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + "offset": 975110848, + "file_name": "cache/NhwcConv_0-conv_inConv_423.const", + "file_size": 1077760 + }, + "NhwcConv_84_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 376320 + ], + "size_in_bytes": 376320, + "op_tensor_size": 376320, + "offset": 976188608, + "file_name": "cache/NhwcConv_0-conv_inConv_424.const", + "file_size": 376320 + }, + "GroupNorm_53_wts_6_2_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 976564928, + "file_name": "cache/NhwcConv_0-conv_inConv_425.const", + "file_size": 1280 + }, + "NhwcConv_85_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 976566208, + "file_name": "cache/NhwcConv_0-conv_inConv_426.const", + "file_size": 125440 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 976691648, + "file_name": "cache/NhwcConv_0-conv_inConv_427.const", + "file_size": 640 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + 
"xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 976692288, + "file_name": "cache/NhwcConv_0-conv_inConv_428.const", + "file_size": 640 + }, + "Attention_13_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 976692928, + "file_name": "cache/NhwcConv_0-conv_inConv_429.const", + "file_size": 118400 + }, + "Attention_13_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 976811328, + "file_name": "cache/NhwcConv_0-conv_inConv_430.const", + "file_size": 118400 + }, + "Attention_13_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 976929728, + "file_name": "cache/NhwcConv_0-conv_inConv_431.const", + "file_size": 118400 + }, + "onnx::MatMul_6075_11_0_52": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 977048128, + "file_name": "cache/NhwcConv_0-conv_inConv_432.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 977165888, + "file_name": "cache/NhwcConv_0-conv_inConv_433.const", + "file_size": 640 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 977166528, + "file_name": 
"cache/NhwcConv_0-conv_inConv_434.const", + "file_size": 640 + }, + "onnx::MatMul_6076": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 977167168, + "file_name": "cache/NhwcConv_0-conv_inConv_435.const", + "file_size": 118400 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_45_bfp.out9_39_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 977285568, + "file_name": "cache/NhwcConv_0-conv_inConv_436.const", + "file_size": 128 + }, + "/up_blocks.3/attentions.0/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_55_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 977285696, + "file_name": "cache/NhwcConv_0-conv_inConv_437.const", + "file_size": 128 + }, + "onnx::MatMul_6086_11_0_53": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 977285824, + "file_name": "cache/NhwcConv_0-conv_inConv_438.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 977403584, + "file_name": "cache/NhwcConv_0-conv_inConv_439.const", + "file_size": 640 + }, + "up_blocks.3.attentions.0.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 977404224, + "file_name": "cache/NhwcConv_0-conv_inConv_440.const", + "file_size": 640 
+ }, + "onnx::MatMul_6087_11_0_54_12_13_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 977404864, + "file_name": "cache/NhwcConv_0-conv_inConv_441.const", + "file_size": 471040 + }, + "onnx::MatMul_6087_11_0_54_12_13_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 977875904, + "file_name": "cache/NhwcConv_0-conv_inConv_442.const", + "file_size": 471040 + }, + "onnx::MatMul_6088_11_0_55": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 978346944, + "file_name": "cache/NhwcConv_0-conv_inConv_443.const", + "file_size": 471040 + }, + "NhwcConv_86_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 978817984, + "file_name": "cache/NhwcConv_0-conv_inConv_444.const", + "file_size": 125440 + }, + "GroupNorm_54_wts_6_0_40": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 978943424, + "file_name": "cache/NhwcConv_0-conv_inConv_445.const", + "file_size": 2560 + }, + "NhwcConv_87_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2155520 + ], + "size_in_bytes": 2155520, + "op_tensor_size": 2155520, + "offset": 978945984, + "file_name": "cache/NhwcConv_0-conv_inConv_446.const", + "file_size": 2155520 + }, + "GroupNorm_55_wts_6_0_41": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 
981101504, + "file_name": "cache/NhwcConv_0-conv_inConv_447.const", + "file_size": 1280 + }, + "NhwcConv_88_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + "offset": 981102784, + "file_name": "cache/NhwcConv_0-conv_inConv_448.const", + "file_size": 1077760 + }, + "NhwcConv_89_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 250880 + ], + "size_in_bytes": 250880, + "op_tensor_size": 250880, + "offset": 982180544, + "file_name": "cache/NhwcConv_0-conv_inConv_449.const", + "file_size": 250880 + }, + "GroupNorm_56_wts_6_2_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 982431424, + "file_name": "cache/NhwcConv_0-conv_inConv_450.const", + "file_size": 1280 + }, + "NhwcConv_90_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 982432704, + "file_name": "cache/NhwcConv_0-conv_inConv_451.const", + "file_size": 125440 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 982558144, + "file_name": "cache/NhwcConv_0-conv_inConv_452.const", + "file_size": 640 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 982558784, + "file_name": "cache/NhwcConv_0-conv_inConv_453.const", + "file_size": 640 + }, + "Attention_14_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, 
+ "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 982559424, + "file_name": "cache/NhwcConv_0-conv_inConv_454.const", + "file_size": 118400 + }, + "Attention_14_qkv_weight_query": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 982677824, + "file_name": "cache/NhwcConv_0-conv_inConv_455.const", + "file_size": 118400 + }, + "Attention_14_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 982796224, + "file_name": "cache/NhwcConv_0-conv_inConv_456.const", + "file_size": 118400 + }, + "onnx::MatMul_6105_11_0_56": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 982914624, + "file_name": "cache/NhwcConv_0-conv_inConv_457.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 983032384, + "file_name": "cache/NhwcConv_0-conv_inConv_458.const", + "file_size": 640 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 983033024, + "file_name": "cache/NhwcConv_0-conv_inConv_459.const", + "file_size": 640 + }, + "onnx::MatMul_6106": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 983033664, + "file_name": 
"cache/NhwcConv_0-conv_inConv_460.const", + "file_size": 118400 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_46_bfp.out9_42_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 983152064, + "file_name": "cache/NhwcConv_0-conv_inConv_461.const", + "file_size": 128 + }, + "/up_blocks.3/attentions.1/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_59_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 983152192, + "file_name": "cache/NhwcConv_0-conv_inConv_462.const", + "file_size": 128 + }, + "onnx::MatMul_6116_11_0_57": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 983152320, + "file_name": "cache/NhwcConv_0-conv_inConv_463.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 983270080, + "file_name": "cache/NhwcConv_0-conv_inConv_464.const", + "file_size": 640 + }, + "up_blocks.3.attentions.1.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 983270720, + "file_name": "cache/NhwcConv_0-conv_inConv_465.const", + "file_size": 640 + }, + "onnx::MatMul_6117_11_0_58_12_14_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 983271360, + "file_name": "cache/NhwcConv_0-conv_inConv_466.const", + 
"file_size": 471040 + }, + "onnx::MatMul_6117_11_0_58_12_14_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 983742400, + "file_name": "cache/NhwcConv_0-conv_inConv_467.const", + "file_size": 471040 + }, + "onnx::MatMul_6118_11_0_59": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 984213440, + "file_name": "cache/NhwcConv_0-conv_inConv_468.const", + "file_size": 471040 + }, + "NhwcConv_91_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 984684480, + "file_name": "cache/NhwcConv_0-conv_inConv_469.const", + "file_size": 125440 + }, + "GroupNorm_57_wts_6_0_42": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1280 + ], + "size_in_bytes": 2560, + "op_tensor_size": 2560, + "offset": 984809920, + "file_name": "cache/NhwcConv_0-conv_inConv_470.const", + "file_size": 2560 + }, + "NhwcConv_92_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2155520 + ], + "size_in_bytes": 2155520, + "op_tensor_size": 2155520, + "offset": 984812480, + "file_name": "cache/NhwcConv_0-conv_inConv_471.const", + "file_size": 2155520 + }, + "GroupNorm_58_wts_6_0_43": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 986968000, + "file_name": "cache/NhwcConv_0-conv_inConv_472.const", + "file_size": 1280 + }, + "NhwcConv_93_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1077760 + ], + "size_in_bytes": 1077760, + "op_tensor_size": 1077760, + 
"offset": 986969280, + "file_name": "cache/NhwcConv_0-conv_inConv_473.const", + "file_size": 1077760 + }, + "NhwcConv_94_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 250880 + ], + "size_in_bytes": 250880, + "op_tensor_size": 250880, + "offset": 988047040, + "file_name": "cache/NhwcConv_0-conv_inConv_474.const", + "file_size": 250880 + }, + "GroupNorm_59_wts_6_2_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 988297920, + "file_name": "cache/NhwcConv_0-conv_inConv_475.const", + "file_size": 1280 + }, + "NhwcConv_95_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 988299200, + "file_name": "cache/NhwcConv_0-conv_inConv_476.const", + "file_size": 125440 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 988424640, + "file_name": "cache/NhwcConv_0-conv_inConv_477.const", + "file_size": 640 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm1.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 988425280, + "file_name": "cache/NhwcConv_0-conv_inConv_478.const", + "file_size": 640 + }, + "Attention_15_qkv_weight_key": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 988425920, + "file_name": "cache/NhwcConv_0-conv_inConv_479.const", + "file_size": 118400 + }, + "Attention_15_qkv_weight_query": { + "packed_buffer_label": "const", + 
"xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 988544320, + "file_name": "cache/NhwcConv_0-conv_inConv_480.const", + "file_size": 118400 + }, + "Attention_15_qkv_weight_value": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 988662720, + "file_name": "cache/NhwcConv_0-conv_inConv_481.const", + "file_size": 118400 + }, + "onnx::MatMul_6135_11_0_60": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 988781120, + "file_name": "cache/NhwcConv_0-conv_inConv_482.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 988898880, + "file_name": "cache/NhwcConv_0-conv_inConv_483.const", + "file_size": 640 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm2.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 988899520, + "file_name": "cache/NhwcConv_0-conv_inConv_484.const", + "file_size": 640 + }, + "onnx::MatMul_6136": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 118400 + ], + "size_in_bytes": 118400, + "op_tensor_size": 118400, + "offset": 988900160, + "file_name": "cache/NhwcConv_0-conv_inConv_485.const", + "file_size": 118400 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/to_q/MatMul_output_0.out2_6_47_bfp.out9_45_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + 
"op_tensor_size": 128, + "offset": 989018560, + "file_name": "cache/NhwcConv_0-conv_inConv_486.const", + "file_size": 128 + }, + "/up_blocks.3/attentions.2/transformer_blocks.0/attn2/Reshape_3_output_0.out2_3_63_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 989018688, + "file_name": "cache/NhwcConv_0-conv_inConv_487.const", + "file_size": 128 + }, + "onnx::MatMul_6146_11_0_61": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 117760 + ], + "size_in_bytes": 117760, + "op_tensor_size": 117760, + "offset": 989018816, + "file_name": "cache/NhwcConv_0-conv_inConv_488.const", + "file_size": 117760 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.weight": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 989136576, + "file_name": "cache/NhwcConv_0-conv_inConv_489.const", + "file_size": 640 + }, + "up_blocks.3.attentions.2.transformer_blocks.0.norm3.bias": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 320 + ], + "size_in_bytes": 640, + "op_tensor_size": 640, + "offset": 989137216, + "file_name": "cache/NhwcConv_0-conv_inConv_490.const", + "file_size": 640 + }, + "onnx::MatMul_6147_11_0_62_12_15_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 989137856, + "file_name": "cache/NhwcConv_0-conv_inConv_491.const", + "file_size": 471040 + }, + "onnx::MatMul_6147_11_0_62_12_15_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 989608896, + "file_name": "cache/NhwcConv_0-conv_inConv_492.const", + 
"file_size": 471040 + }, + "onnx::MatMul_6148_11_0_63": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 471040 + ], + "size_in_bytes": 471040, + "op_tensor_size": 471040, + "offset": 990079936, + "file_name": "cache/NhwcConv_0-conv_inConv_493.const", + "file_size": 471040 + }, + "NhwcConv_96_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 125440 + ], + "size_in_bytes": 125440, + "op_tensor_size": 125440, + "offset": 990550976, + "file_name": "cache/NhwcConv_0-conv_inConv_494.const", + "file_size": 125440 + }, + "GroupNorm_60_wts_6_0_44": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 640 + ], + "size_in_bytes": 1280, + "op_tensor_size": 1280, + "offset": 990676416, + "file_name": "cache/NhwcConv_0-conv_inConv_495.const", + "file_size": 1280 + }, + "GroupNorm_60.out7_60.out6_0_44_bfp.out7_60_bfp.wts": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 64 + ], + "size_in_bytes": 128, + "op_tensor_size": 128, + "offset": 990677696, + "file_name": "cache/NhwcConv_0-conv_inConv_496.const", + "file_size": 128 + }, + "NhwcConv_97_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 54400 + ], + "size_in_bytes": 54400, + "op_tensor_size": 54400, + "offset": 990677824, + "file_name": "cache/NhwcConv_0-conv_inConv_497.const", + "file_size": 54400 + } + }, + "aux_info": {} } \ No newline at end of file diff --git a/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt new file mode 100644 index 0000000000000000000000000000000000000000..33ca3bb9e64aec66af7a7afb2f8458554e9639f3 --- /dev/null +++ b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:7a4fe28ec5a9a880d48b1d51513dc5020f00ee752345a81924248653c69e935c +size 31494360 diff --git a/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst new file mode 100644 index 0000000000000000000000000000000000000000..8ebaa22167e89669041e0b5fe1c238c572c78d98 --- /dev/null +++ b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bca2c247191ff4cad5d5a3d224d3a7c3394e140d55ea87d52e46a7824d1f00c3 +size 990731584 diff --git a/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state new file mode 100644 index 0000000000000000000000000000000000000000..12e32e37d640fd944dc992e548e5335190db5435 --- /dev/null +++ b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6b1af0fee539884ba41a2fdb91c4bd58e541182d17d8022bf30e0287e11ecd1 +size 9864837 diff --git a/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super new file mode 100644 index 0000000000000000000000000000000000000000..367bbc2c48c9cee8db99bdc58c8f02c79d257c1d --- /dev/null +++ b/unet/dd/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1248c187b5b209a54a2555d999a0a774ce336d9a22fb136550232f079df36dc9 +size 1046920 diff --git a/unet/dd/onnx_report.txt b/unet/dd/onnx_report.txt new file mode 100644 index 0000000000000000000000000000000000000000..7cdfbf127d1eef6d3be39e909ed17c9e90dbf75c --- /dev/null +++ b/unet/dd/onnx_report.txt @@ -0,0 +1,58 @@ + DynamicDispatch Offload - not offloaded ++-------------------+-------+------------------------+------------------------+ +| Op Type | Count | Inputs | Outputs | ++===================+=======+========================+========================+ 
+| Cast | 1 | [2,1] - DOUBLE | [2,1] - FLOAT | +| CastAvx | 1 | [2,64,64,4] - FLOAT | [2,64,64,4] - BFLOAT16 | +| CastAvx | 1 | [2,77,768] - FLOAT | [2,77,768] - BFLOAT16 | +| CastAvx | 1 | [2,320] - FLOAT | [2,320] - BFLOAT16 | +| CastAvx | 1 | [2,64,64,4] - BFLOAT16 | [2,64,64,4] - FLOAT | +| Concat | 1 | [2,160] - FLOAT | [2,320] - FLOAT | +| | | [2,160] - FLOAT | | +| Cos | 1 | [2,160] - FLOAT | [2,160] - FLOAT | +| Expand | 1 | [1] - DOUBLE | [2] - DOUBLE | +| | | [1] - INT64 | | +| Mul | 1 | [2,1] - FLOAT | [2,160] - FLOAT | +| | | [1,160] - FLOAT | | +| Reshape | 1 | [2] - DOUBLE | [2,1] - DOUBLE | +| | | [2] - INT64 | | +| Sin | 1 | [2,160] - FLOAT | [2,160] - FLOAT | +| Transpose | 1 | [2,4,64,64] - FLOAT | [2,64,64,4] - FLOAT | +| Transpose | 1 | [2,64,64,4] - FLOAT | [2,4,64,64] - FLOAT | ++-------------------+-------+------------------------+------------------------+ +| Not offloaded sum | 13 | | | ++-------------------+-------+------------------------+------------------------+ + DynamicDispatch Offload - offloaded ++-------------------+-----------------+-------------------+-------------------+ +| Op Type | Count | Inputs | Outputs | ++===================+=================+===================+===================+ +| DynamicDispatch | 1 | [2,64,64,4] - | [2,64,64,4] - | +| | | BFLOAT16 | BFLOAT16 | +| | | [2,77,768] - | | +| | | BFLOAT16 | | +| | | [2,320] - | | +| | | BFLOAT16 | | ++-------------------+-----------------+-------------------+-------------------+ +| Offloaded sum | 1 | | | ++-------------------+-----------------+-------------------+-------------------+ +| Offloaded Op | SDMHA_bfp | | | +| Types | SDResize_bfp | | | +| | SDConv | | | +| | SDGemm | | | +| | SDCastBfp2Bf | | | +| | SDAdd_bfp | | | +| | SDConcat_bfp | | | +| | SDFlatMHA | | | +| | SDSilu | | | +| | SDGemm_bfp | | | +| | SDMul_bfp | | | +| | SDGroupNorm_bfp | | | +| | SDCastBf2Bfp | | | +| | SDConv_bfp | | | +| | SDLayerNorm_bfp | | | 
++-------------------+-----------------+-------------------+-------------------+ +| Offloaded sum (dd | 618 | | | +| fusion) | | | | +| Offload Ratio (dd | 97.94% | | | +| fusion) | | | | ++-------------------+-----------------+-------------------+-------------------+ diff --git a/unet/dd/replaced.onnx b/unet/dd/replaced.onnx new file mode 100644 index 0000000000000000000000000000000000000000..b44d4ba68b3516f6bfe42c2f0034b09abe7a369e --- /dev/null +++ b/unet/dd/replaced.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b6ad2995d946d991520b77d112493a42d1e3e7d53fc55519c16357fdd9927a +size 582744 diff --git a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt b/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt deleted file mode 100644 index c4ee33782d2e332e2136b7ce018fcd2eb0e85ba9..0000000000000000000000000000000000000000 --- a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.ctrlpkt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:48547214fbff1161a46e43c00f93f8715cc3c929cde451d80aa3bb0b1236bc02 -size 32919360 diff --git a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst b/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst deleted file mode 100644 index 96a9b87a0c1896daef1b1f5028f7cd77ba05bb24..0000000000000000000000000000000000000000 --- a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.fconst +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8ba147867685fb38b560328fd74ac596f98bf3512ed599cf1bc51642b8166b02 -size 990629184 diff --git a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state b/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state deleted file mode 100644 index 2689e3411a780fddb5b2ca53bac6ba63caff5b29..0000000000000000000000000000000000000000 --- a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.state +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid 
sha256:e897be73fc881906a360e2013784c34e7be77e4bd4b63d644813e5f39c999885 -size 10390907 diff --git a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super b/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super deleted file mode 100644 index 2751b6f0a1e7dcc48735603d808f10763e1b5477..0000000000000000000000000000000000000000 --- a/unet/dd_metastate_SD15_Unet_NhwcConv_0-conv_inConv.super +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a2eb5395c916b181067e17a3ea2c47c13326ab59169fdc6f7fa1295d09ed7a22 -size 997128 diff --git a/unet/model_NCHW.onnx b/unet/model_NCHW.onnx deleted file mode 100644 index 3ec54315b254559adb6a747e93780fc412e0a661..0000000000000000000000000000000000000000 --- a/unet/model_NCHW.onnx +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8c93efa63475ca1ff7b813542fd4532e1637fff1efe362335d07427e6ce1e9d5 -size 38301 diff --git a/unet/model_NHWC.onnx b/unet/model_NHWC.onnx deleted file mode 100644 index 0dfed19e9d011b043ec5b54437d50a7843428d5c..0000000000000000000000000000000000000000 --- a/unet/model_NHWC.onnx +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:bc6bccf7bc6322864397d0b44159471137db857f167129a55d5db0ec5761759e -size 38020 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_0.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_0.const deleted file mode 100644 index 33958b81fcadae712ed4c15efae9bb200eddbf74..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_0.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_1.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_1.const deleted file mode 100644 index d359d17674291fb17633e04f2c49206169b45039..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_1.const and /dev/null differ diff --git 
a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_10.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_10.const deleted file mode 100644 index 1a1f3c5aef84d24dccdd7de96a8d9c22131e00cb..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_10.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b132a2c946d7a90a654d4da2df6f8e363a3b6149244e121d3bf77365ebc6008d -size 299008 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_100.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_100.const deleted file mode 100644 index b92bd6bb006ea9081b8b9970583b3bb7e610da92..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_100.const +++ /dev/null @@ -1 +0,0 @@ -1??*?H?r?L?r?E?h?~?^?_?T?P?>?W?E?z??u?k?q?H?}?R?w??g??>?D???z?r?i?V???m?H?>?e?t?a?|?P?U?q?T?q?Z?J?J??M?P??0?.?>?e?*?g?V?F?`?#?r?k?t?0??@?i?8?o?g??4?=??u?j?|?{?j?9?[?T?X?@???3?n?A?"?v?R?P?K?c?5??W?K???g?`???U?d???9?S?x?k?@?c?t??Q?|?Y??:߽Ž!=һmi//Ϻ>Ž*?GO¼V4K4\15*<ʽϹཤȼ'Ͻ<½<u2Hrj;?p?>???>z??+??f?#?g?w?k??>?$?!????/?.?-??@?=?@?@?M?@?>?C?A?H?+?@?@?,?4?F?>?D?0?7?.?A?2?;?5????> ??>?}?x??!?x?>??+?G?3??"?+?!?0?)?A?+?7?*?7?/?5?2?+?.?!?.?;??'?+?=?/?(?(?8?)?-?j?>?>?w???>?????[??5??4??#?.?0?.?+?%?6?&?;?2?+?'?1?.?!??(??0?&??8?0??$?-?*?!?!?!?+? ?'?'???@?O?=?*?%?$?L?&?e?-?v?%???=????r?7????>?t?????%??A?&?B?#?i?>???? 
?+?&???J??%??eҾܾ龵˽Gy=DԽ񽴽ٽ=νܽA}@=vŽ -{nӽҽ۽ͽ=G=zV:[=wH(cپQ^ (ս}=̽ԽٽϽڽӽѽս=齞ڽн̽qei۾޾iO?=ȽýֽݽؽQ=뽩ͽʽŽڽ*(G1=67=41904*gb}ξtH9վeپV=нȽͽླྀɽսȽý˼v@pl=ӾEо^ѾϾpj#V׽=ƽƽǽֽܽνi= -D(G'9=S$$GU!$=Žѽʽp]=_k8=}~:=gj(`ZPu:S= - ʽнԽ =HFȾ=nzhS5f˽Ovynf -Žh=zw½ \ No newline at end of file diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_3.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_3.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_3.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_30.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_30.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_30.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_31.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_31.const deleted file mode 100644 index a15c4b90ec23d896606f9d2bee45e61c254a6236..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_31.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:9de51f0bfbde9c1dcd89bf10d276834169102130fdb2d7862c604410847b4337 -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_32.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_32.const deleted file mode 100644 index d121c85da8a8b2dd8a90502686845418e6e2daba..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_32.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_33.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_33.const deleted file mode 100644 index 
65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_33.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_34.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_34.const deleted file mode 100644 index 3bb06d8f6a35c13fbf730073e2ca1ba6182d19a4..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_34.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:438dc5020724390bad099179e128084793bf0bd64c89b220881ae93ef645617e -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_35.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_35.const deleted file mode 100644 index 539659920a86e6c15a38f9fa9a309d452769d917..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_35.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_36.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_36.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_36.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_37.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_37.const deleted file mode 100644 index 507048e9e4982e975be1ad425423ed4477d62bcd..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_37.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0447151bb8ca42b081a7abbf29326a1762febb6dc16ce0a6b5ac5269081cd385 -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_38.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_38.const deleted file mode 100644 index 
65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_38.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_39.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_39.const deleted file mode 100644 index 40464ff6bb7137d5d2fe8fd3244d6fcd31fb9683..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_39.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6c1c330d24555ddd0c2e014ed03043917bf8913222b81283f9c7054913b3492e -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_4.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_4.const deleted file mode 100644 index d5237db5ef016105af543004aecde5ab0786e56b..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_4.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:b4aef5e03c44f14ffaefb9e24c703d3b921c9528478db357fbf7d99abfd2748e -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_40.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_40.const deleted file mode 100644 index 97346da76af83a62b0523d209b0004762045468b..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_40.const +++ /dev/null @@ -1 +0,0 @@ 
-??d?Q???X???s?X?Q?f??j?e???????t?P?l???b??u????v?h??i?_?????l????{?g??P??S?z??????c??????L??r??w???l?\?r?c??a?{?>?]???X???b????m???}???????P?????????]????????d?|??_???z????j??P?H??R?h?F?R?i?'?Q?B?L??d?X?~??~?r??\?Z?|??s????W??~?x??{??u?????a???S??e??}???????????}???u???i??????y??q???U?j??~???n?????h?}???V???????}?v?????????j???_??i???s??~?q??g?q?c?b????u??}?}?L????]????q??o??i?t?b???x?x?O???5????n?a?c?M?s?Q?O?X?\?@?V?b?V?h?T?]???h?Z?n???c??X??????v?o???N???????o?X????g?\??e????~??i???N?E??t??c??>^?m?{?S?o?k?y?z?i?f?n?q??`?h?p?v?[??b?`?M?h?j?h?i?h?8??Y????????????w?p?n?????p???l??????U???n???x?t??????e??b???h?b??|?V?z???????u?????y??\???????v?l??r?????`?>@?@???V??.?Z?\?J?C?P?+?)?????v?r???U??????V??N?l??>u??h?u?l?F??B?T?u?d??|J{Wj^FUtgtrAexrtMk]eho_Y]|dM vDqIv'nWdyOtJQɽ{???G????????_????????m???9??d???>???-?Z???Q?>???d?k???m??7???????5??6??????Q?\?j??????R?k??t??n?v?Q??:???[???&????-??????O??g????s???T?? ?I???????b?????X???-?I?x??y???.??????????S?+?#????????T?6??*? ?????J????2?.????2????4???E?>???@?|??*??W????4????a???O?E?O??T???E???D?C??X??Q??1?????????+??????Q???T??m?f???t?v?^???o??H?S??W?_??=?K???y?????@??D??B?_?Q?A?i?j???n??}?s????O?M??????;??j???:?????:?n??gswkؾɾDپ־ɾȾmgžtyrѾTo־ZھzоT*Fkξƾ(Xjþ;ϾS] Ͼվ꾽ݾEi־ھɾ^bþҾh ݾ꾫_nϾ۾Pоp˾辈K_̾ž辯ھvX޾ľᾛ׾5ݾ~0þi?7Qھվ`̾c¾ž]pI{FO~{ھoaɾIc&:ľ¾ξɾҾ߾cξҾӾɾixM\oϾپ.wо0˾Ծ\2G߾\ԾҾ0羙Ӿ.]ľɾ@Ǿھ⾨WC⾲Ͼsľξ¾RQ$;d???u?y?}?u?m?s?g?u?y?3?]?k?h?|?`??u?h?E?_?u?j?u?u?&?p?x??|?n?o???s??l?m?o?r?z?o??????~?n?v??Z??w?????|?v?g?m?p????v?w?]?V?n???Z?i??p?w???g??h???{????x?{??????{??}?y?h??j?????p??j?6??&?t? -?L?n?s?j?h?r?Q?(??h??c??{????z??|?|??x?x?a?x?? ?v??~??{?l??C?p??x?~? 
%}Z5cytdu|hZnQiY|ibdweS -K|_y#-ӽ eiQo$>;AE]F8@N2OGJ0J.MeUcED`T{bYYwdFb`\Z@;;E?_&3`f*:E14RMu[hy*Na=rLLux`ABl@QHuPds.bx_DbuQE1@cVZmR޽J[`LX5@)#T6սsElr{RuFCqi55.fy XFzWg~y]RԽ^nd^K\;gSxjoUg6-~iRj>"nyBM?o':*>CYJxm^pN//p5">SULJyYHK?exgHQdFUXSD 2 <ȽWDX/㽑2 "Ͻ -i[0%UU, 1PmnNWv|b(Afhfqc !M=N]h^lvH4xQOrSM[J;X<,=DNNwxH9]ir5XiؾF[uݾ޽޽~1#nv7ORj|hg@lJξ ܽɽD& \ No newline at end of file diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_53.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_53.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_53.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_54.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_54.const deleted file mode 100644 index dcd9a194dac7bee364257c60ee393d26657453fa..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_54.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:cb8f973d10ceec12a5ab1217e67c2ed5b206c6f1a5dab7aaa8ddfafcc35dbf2f -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_55.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_55.const deleted file mode 100644 index 50bd493eaf270f05d376974f3814b57624bb34c3..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_55.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_56.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_56.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_56.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_57.const 
b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_57.const deleted file mode 100644 index 5c339160be3e87e9b1167fd25be997a6cf53ffd5..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_57.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:6dfe148c6241538e0bbf0e647b1707f16bf586eea2e22f2b84df289be7ec6b0b -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_58.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_58.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_58.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_59.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_59.const deleted file mode 100644 index 3c2b7866b243ae14b9b3686fc9e89fd7dcd81a9f..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_59.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ebe2f979fca8555235041e584da567dc153a8f64c51cd22d72fc8f7f158314f0 -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_6.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_6.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_6.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_60.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_60.const deleted file mode 100644 index 4bc344ec8c4189b2d8d33177fea94002aa078933..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_60.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_61.const 
b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_61.const deleted file mode 100644 index c785f3fa01efd87f5eb87baf02f64574094086a8..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_61.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:365fa8495ca4144322ed9708cfe32f2e688fe3e06edf25bedc3d8c6ffaf26c3f -size 163840 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_62.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_62.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_62.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_63.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_63.const deleted file mode 100644 index 3385ca9b292f22d7ab7bf2b9d85e3dcbe5ae99df..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_63.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:5521794d85ef3c12f7723038fb436c4bcbc937c288bd85956d67b01abff7211f -size 1392640 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_64.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_64.const deleted file mode 100644 index 0d9a39fc4de2aa4a9b4fdbaae881aaab60a5b6b8..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_64.const +++ /dev/null @@ -1 +0,0 @@ -R????@?i??{?????????????????????????????????????????????????????????????????????????????????????????????????????????????????p?m?????w?Q?????????Z?????????s?????z????????????????????????????????????[??~??_?s???????????????v?????????????????????????????????????????????w?????x79,E&HZ\xOu}[LI$3,,(w=Y75LGsce^½½߼ν˽t`>EhPP@R'ǽ':8!7P>\tν̽:<ɽ缑q ro̽_0Qd>/B@)a579`7- z,4+ҽP۽ \ No newline at end of file diff --git 
a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_65.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_65.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_65.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_66.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_66.const deleted file mode 100644 index e7029f98bb47e3f71c8b22d53675a2bc3dc0920d..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_66.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:8a9a898fc31011ee674686b8e252db344240eab4e5d694c0f19bc0fdd6f70400 -size 696320 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_67.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_67.const deleted file mode 100644 index 701d1287999cb3fae1b5531dd7c4044495c95b7e..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_67.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_68.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_68.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_68.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_69.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_69.const deleted file mode 100644 index d7ea6d1ed36129e777fa2199ab949b7f13642bf2..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_69.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:a6e384ddc4141be48cc2373f89be3fbb49f867a159de51c564d98019b8d4d842 -size 696320 diff --git 
a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_7.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_7.const deleted file mode 100644 index 9ebf08b7695ca29458e02b87e8388a3d1491c583..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_7.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:e2aa040c58d5d4e42db2577b4375776b8bf7dae287f5808f68cca450d2975f97 -size 2785280 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_70.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_70.const deleted file mode 100644 index 564b9201aabdbcd71084edbe6e45df72dd22f2e4..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_70.const +++ /dev/null @@ -1,5 +0,0 @@ -????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????G????????+n=6q?FoWa -54Q#DcQMIF(OJXBGnW_Q?^+9,_Z<@MZbl%bcZ;lERw`!P;ESJŽIbf<*P=?jkIsLDPQ;@ 7lm -3bѽ)X+iajP[dBjaOC(z8y(!URbc"'RKt8V/]CO19Aai -p7(2Fik;?:S -X >SeQn1C6J=Vu罃v;H'a_B?lWUhGB!I@L=AXEDNf1~c).M %c, 󽷽 \ No newline at end of file diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_71.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_71.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_71.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_72.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_72.const deleted file mode 100644 index 4e1f791266a57840803afc87547d1504966d4cde..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_72.const +++ /dev/null @@ -1,3 +0,0 @@ -version 
https://git-lfs.github.com/spec/v1 -oid sha256:05be2356504faa828405db66fd5361f0040ff63dc6653f08030beb6ddd232f1b -size 696320 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_73.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_73.const deleted file mode 100644 index ea3a2ca3c0ff8ca59f99f7f8e4c013e045a8c66e..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_73.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_74.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_74.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_74.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_75.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_75.const deleted file mode 100644 index fdd0d698e916a44232ec6d94a1d7e89d84255209..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_75.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:772ac43a6a0a2d7e1033c04ca33b5b84d5636731f07322f6b7eabb8919d1158b -size 696320 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_76.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_76.const deleted file mode 100644 index 8a798288d6546d8707e9a4312a0d8b46dd6513ce..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_76.const +++ /dev/null @@ -1 +0,0 @@ -??????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????j??????????????????????????????????????????????????????????????????????????????????hI%m{z_Dn ._y^J\HAŽĽ?0-`Zw{E*OC((/s*CV6|r;J;ty \ No newline at end of file diff --git 
a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_77.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_77.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_77.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_78.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_78.const deleted file mode 100644 index 5037b53a977725b3475eb6b09bccfffa85990d13..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_78.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:890bdf706b2d985d4f94e340b872d9b49dbf53efebe58214803a61f6816077ad -size 696320 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_79.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_79.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_79.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_8.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_8.const deleted file mode 100644 index 097d6d1766eab9795c26d2cb889c6bf1ef51aa87..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_8.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_80.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_80.const deleted file mode 100644 index 42e054dc60f8d6fc252269d3af3b3c77af83169c..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_80.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:0db1be880cba8928b8a26ea82b01f93e9cf51f2624f0abc90b69c2eea9a3b257 -size 696320 diff --git 
a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_81.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_81.const deleted file mode 100644 index 1fefa6765d26752dfb4f7614867fa6413089cd47..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_81.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_82.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_82.const deleted file mode 100644 index a05b9aca790303874d1e31069d1a15bddc659a17..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_82.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_83.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_83.const deleted file mode 100644 index 65f57c2ee985713476ac0b6e3483e6fe472e2176..0000000000000000000000000000000000000000 Binary files a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_83.const and /dev/null differ diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_84.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_84.const deleted file mode 100644 index 715184a579ff08e3b79556fa5ba04c8c9ea92758..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_84.const +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c3f47738fdcdf372f3be1f5ec7a938237d22a15e8530f6efb8659d293c0f238c -size 348160 diff --git a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_85.const b/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_85.const deleted file mode 100644 index 76a03645dafa664556086315e45b8dad69d901d4..0000000000000000000000000000000000000000 --- a/vae_decoder/.cache/NhwcConv_0-post_quant_convConv_85.const +++ /dev/null @@ -1 +0,0 @@ -????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????????^==@