diff --git "a/vae_decoder/RyzenAI/.cache/NhwcConv_0-post_quant_convConv_meta.json" "b/vae_decoder/RyzenAI/.cache/NhwcConv_0-post_quant_convConv_meta.json" new file mode 100644--- /dev/null +++ "b/vae_decoder/RyzenAI/.cache/NhwcConv_0-post_quant_convConv_meta.json" @@ -0,0 +1,12160 @@ +{ + "dd_meta_major_version": 1, + "dd_meta_minor_version": 2, + "state_table_updates": [], + "op_list": [ + { + "name": "NhwcConv_0-/post_quant_conv/Conv", + "type": "SDConv", + "in_args": [ + "Transpose_0_out-latents.out0_1_0" + ], + "const_args": [ + "NhwcConv_0_weight_NHWC" + ], + "out_args": [ + "NhwcConv_0_out-/post_quant_conv/Conv_output_0.out0_1_0" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "4" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "4" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "4", + "1", + "1", + "4" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_1-/decoder/conv_in/Conv", + "type": "SDConv", + "in_args": [ + "NhwcConv_0_out-/post_quant_conv/Conv_output_0.out0_1_0" + ], + "const_args": [ + "NhwcConv_1_weight_NHWC" + ], + "out_args": [ + "NhwcConv_1_out-/decoder/conv_in/Conv_output_0.out0_1_1" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "4" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "4" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_0", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_1_out-/decoder/conv_in/Conv_output_0.out0_1_1" + ], + "const_args": [ + "GroupNorm_0_wts_7_1_0" + ], + "out_args": [ + "GroupNorm_0.out9_0.out7_1_0" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_0", + "type": "SDSilu", + "in_args": [ + "GroupNorm_0.out9_0.out7_1_0" + ], + "const_args": [ + "Sigmoid_0.weights9_0" + ], + "out_args": [ + "GroupNorm_0_sigmoid_out.9_0.out9_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_2-/decoder/mid_block/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_0_sigmoid_out.9_0.out9_0" + ], + "const_args": [ + "NhwcConv_2_weight_NHWC" + ], + "out_args": [ + "NhwcConv_2_out-/decoder/mid_block/resnets.0/conv1/Conv_output_0.out0_1_2" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_1", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_2_out-/decoder/mid_block/resnets.0/conv1/Conv_output_0.out0_1_2" + ], + "const_args": [ + "GroupNorm_1_wts_7_1_1" + ], + "out_args": [ + "GroupNorm_1.out9_1.out7_1_1" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_1", + "type": "SDSilu", + "in_args": [ + "GroupNorm_1.out9_1.out7_1_1" + ], + "const_args": [ + "Sigmoid_1.weights9_1" + ], + "out_args": [ + "GroupNorm_1_sigmoid_out.9_1.out9_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_3-/decoder/mid_block/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_1_sigmoid_out.9_1.out9_1" + ], + "const_args": [ + "NhwcConv_3_weight_NHWC" + ], + "out_args": [ + "NhwcConv_3_out-/decoder/mid_block/resnets.0/conv2/Conv_output_0.out0_1_3" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_1_out-/decoder/conv_in/Conv_output_0.out0_1_1", + "NhwcConv_3_out-/decoder/mid_block/resnets.0/conv2/Conv_output_0.out0_1_3" + ], + "const_args": [], + "out_args": [ + "/decoder/mid_block/resnets.0/Add.out_4_1_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_2", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/mid_block/resnets.0/Add.out_4_1_0" + ], + "const_args": [ + "GroupNorm_2_wts_7_0_0" + ], + "out_args": [ + "/decoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out7_0_0" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/attentions.0/to_k/MatMul", + "type": "SDGemm", + "in_args": [ + "/decoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out7_0_0" + ], + "const_args": [ + "onnx::MatMul_918" + ], + "out_args": [ + "/decoder/mid_block/attentions.0/to_k/Add_output_0.out2_3_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "512" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/attentions.0/to_q/MatMul", + "type": "SDGemm", + "in_args": [ + "/decoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out7_0_0" + ], + "const_args": [ + "onnx::MatMul_917" + ], + "out_args": [ + "/decoder/mid_block/attentions.0/to_q/Add_output_0.out2_3_1" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "512" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/attentions.0/to_v/MatMul", + "type": "SDGemm", + "in_args": [ + "/decoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out7_0_0" + ], + "const_args": [ + "onnx::MatMul_919" + ], + "out_args": [ + "/decoder/mid_block/attentions.0/to_v/Add_output_0.out2_3_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "512" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/attentions.0/MatMulmha_1_0", + "type": "SDMHA", + "in_args": [ + "/decoder/mid_block/attentions.0/to_q/Add_output_0.out2_3_1", + "/decoder/mid_block/attentions.0/to_k/Add_output_0.out2_3_0", + "/decoder/mid_block/attentions.0/to_v/Add_output_0.out2_3_2" + ], + "const_args": [ + "/decoder/mid_block/attentions.0/MatMulmha_1_0_mask.13_0" + ], + "out_args": [ + "/decoder/mid_block/attentions.0/Reshape_4_output_0.out13_0" + ], + "attrs": { + "num_heads": { + "type": "int", + "value": [ + "1" + ] + }, + "unidirectional": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512", + "4096" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/attentions.0/to_out.0/MatMul", + "type": "SDGemm", + "in_args": [ + "/decoder/mid_block/attentions.0/Reshape_4_output_0.out13_0" + ], + "const_args": [ + "onnx::MatMul_927" + ], + "out_args": [ + "/decoder/mid_block/attentions.0/Reshape_5_output_0.nhwc3_0.out2_0_0" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "4096", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "512" + ] + }, + "bias_enable": { + "type": "int", + "value": [ + "1" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/attentions.0/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/mid_block/attentions.0/Reshape_5_output_0.nhwc3_0.out2_0_0", + "/decoder/mid_block/resnets.0/Add.out_4_1_0" + ], + "const_args": [], + "out_args": [ + "/decoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_3", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_1" + ], + "const_args": [ + "GroupNorm_3_wts_7_1_2" + ], + "out_args": [ + "GroupNorm_3.out9_3.out7_1_2" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_2", + "type": "SDSilu", + "in_args": [ + "GroupNorm_3.out9_3.out7_1_2" + ], + "const_args": [ + "Sigmoid_2.weights9_2" + ], + "out_args": [ + "GroupNorm_3_sigmoid_out.9_3.out9_2" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_4-/decoder/mid_block/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_3_sigmoid_out.9_3.out9_2" + ], + "const_args": [ + "NhwcConv_4_weight_NHWC" + ], + "out_args": [ + "NhwcConv_4_out-/decoder/mid_block/resnets.1/conv1/Conv_output_0.out0_1_4" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_4", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_4_out-/decoder/mid_block/resnets.1/conv1/Conv_output_0.out0_1_4" + ], + "const_args": [ + "GroupNorm_4_wts_7_1_3" + ], + "out_args": [ + "GroupNorm_4.out9_4.out7_1_3" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_3", + "type": "SDSilu", + "in_args": [ + "GroupNorm_4.out9_4.out7_1_3" + ], + "const_args": [ + "Sigmoid_3.weights9_3" + ], + "out_args": [ + "GroupNorm_4_sigmoid_out.9_4.out9_3" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_5-/decoder/mid_block/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_4_sigmoid_out.9_4.out9_3" + ], + "const_args": [ + "NhwcConv_5_weight_NHWC" + ], + "out_args": [ + "NhwcConv_5_out-/decoder/mid_block/resnets.1/conv2/Conv_output_0.out0_1_5" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/mid_block/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_1", + "NhwcConv_5_out-/decoder/mid_block/resnets.1/conv2/Conv_output_0.out0_1_5" + ], + "const_args": [], + "out_args": [ + "/decoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_5", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_2" + ], + "const_args": [ + "GroupNorm_5_wts_7_1_4" + ], + "out_args": [ + "GroupNorm_5.out9_5.out7_1_4" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_4", + "type": "SDSilu", + "in_args": [ + "GroupNorm_5.out9_5.out7_1_4" + ], + "const_args": [ + "Sigmoid_4.weights9_4" + ], + "out_args": [ + "GroupNorm_5_sigmoid_out.9_5.out9_4" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_6-/decoder/up_blocks.0/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_5_sigmoid_out.9_5.out9_4" + ], + "const_args": [ + "NhwcConv_6_weight_NHWC" + ], + "out_args": [ + "NhwcConv_6_out-/decoder/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_6" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_6", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_6_out-/decoder/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_6" + ], + "const_args": [ + "GroupNorm_6_wts_7_1_5" + ], + "out_args": [ + "GroupNorm_6.out9_6.out7_1_5" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_5", + "type": "SDSilu", + "in_args": [ + "GroupNorm_6.out9_6.out7_1_5" + ], + "const_args": [ + "Sigmoid_5.weights9_5" + ], + "out_args": [ + "GroupNorm_6_sigmoid_out.9_6.out9_5" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_7-/decoder/up_blocks.0/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_6_sigmoid_out.9_6.out9_5" + ], + "const_args": [ + "NhwcConv_7_weight_NHWC" + ], + "out_args": [ + "NhwcConv_7_out-/decoder/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_7" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.0/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_2", + "NhwcConv_7_out-/decoder/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_7" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.0/resnets.0/Add_output_0_NHWC.out_4_1_3" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_7", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.0/resnets.0/Add_output_0_NHWC.out_4_1_3" + ], + "const_args": [ + "GroupNorm_7_wts_7_1_6" + ], + "out_args": [ + "GroupNorm_7.out9_7.out7_1_6" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_6", + "type": "SDSilu", + "in_args": [ + "GroupNorm_7.out9_7.out7_1_6" + ], + "const_args": [ + "Sigmoid_6.weights9_6" + ], + "out_args": [ + "GroupNorm_7_sigmoid_out.9_7.out9_6" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_8-/decoder/up_blocks.0/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_7_sigmoid_out.9_7.out9_6" + ], + "const_args": [ + "NhwcConv_8_weight_NHWC" + ], + "out_args": [ + "NhwcConv_8_out-/decoder/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_8" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_8", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_8_out-/decoder/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_8" + ], + "const_args": [ + "GroupNorm_8_wts_7_1_7" + ], + "out_args": [ + "GroupNorm_8.out9_8.out7_1_7" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_7", + "type": "SDSilu", + "in_args": [ + "GroupNorm_8.out9_8.out7_1_7" + ], + "const_args": [ + "Sigmoid_7.weights9_7" + ], + "out_args": [ + "GroupNorm_8_sigmoid_out.9_8.out9_7" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_9-/decoder/up_blocks.0/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_8_sigmoid_out.9_8.out9_7" + ], + "const_args": [ + "NhwcConv_9_weight_NHWC" + ], + "out_args": [ + "NhwcConv_9_out-/decoder/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_9" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.0/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.0/resnets.0/Add_output_0_NHWC.out_4_1_3", + "NhwcConv_9_out-/decoder/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_9" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.0/resnets.1/Add_output_0_NHWC.out_4_1_4" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_9", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.0/resnets.1/Add_output_0_NHWC.out_4_1_4" + ], + "const_args": [ + "GroupNorm_9_wts_7_1_8" + ], + "out_args": [ + "GroupNorm_9.out9_9.out7_1_8" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_8", + "type": "SDSilu", + "in_args": [ + "GroupNorm_9.out9_9.out7_1_8" + ], + "const_args": [ + "Sigmoid_8.weights9_8" + ], + "out_args": [ + "GroupNorm_9_sigmoid_out.9_9.out9_8" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_10-/decoder/up_blocks.0/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_9_sigmoid_out.9_9.out9_8" + ], + "const_args": [ + "NhwcConv_10_weight_NHWC" + ], + "out_args": [ + "NhwcConv_10_out-/decoder/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_10" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_10", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_10_out-/decoder/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_10" + ], + "const_args": [ + "GroupNorm_10_wts_7_1_9" + ], + "out_args": [ + "GroupNorm_10.out9_10.out7_1_9" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_9", + "type": "SDSilu", + "in_args": [ + "GroupNorm_10.out9_10.out7_1_9" + ], + "const_args": [ + "Sigmoid_9.weights9_9" + ], + "out_args": [ + "GroupNorm_10_sigmoid_out.9_10.out9_9" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_11-/decoder/up_blocks.0/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_10_sigmoid_out.9_10.out9_9" + ], + "const_args": [ + "NhwcConv_11_weight_NHWC" + ], + "out_args": [ + "NhwcConv_11_out-/decoder/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_11" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.0/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.0/resnets.1/Add_output_0_NHWC.out_4_1_4", + "NhwcConv_11_out-/decoder/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_11" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.0/resnets.2/Add_output_0.nhwc2_0.out_4_1_5" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.0/upsamplers.0/Resize", + "type": "SDResize", + "in_args": [ + "/decoder/up_blocks.0/resnets.2/Add_output_0.nhwc2_0.out_4_1_5" + ], + "const_args": [ + "/decoder/up_blocks.0/upsamplers.0/Resize.weights10_0" + ], + "out_args": [ + "/decoder/up_blocks.0/upsamplers.0/Resize_output_0.nhwc2_0.out_10_0" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "64", + "64", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_12-/decoder/up_blocks.0/upsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/decoder/up_blocks.0/upsamplers.0/Resize_output_0.nhwc2_0.out_10_0" + ], + "const_args": [ + "NhwcConv_12_weight_NHWC" + ], + "out_args": [ + "NhwcConv_12_out-/decoder/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_12" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_11", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_12_out-/decoder/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_12" + ], + "const_args": [ + "GroupNorm_11_wts_7_1_10" + ], + "out_args": [ + "GroupNorm_11.out9_11.out7_1_10" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_10", + "type": "SDSilu", + "in_args": [ + "GroupNorm_11.out9_11.out7_1_10" + ], + "const_args": [ + "Sigmoid_10.weights9_10" + ], + "out_args": [ + "GroupNorm_11_sigmoid_out.9_11.out9_10" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_13-/decoder/up_blocks.1/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_11_sigmoid_out.9_11.out9_10" + ], + "const_args": [ + "NhwcConv_13_weight_NHWC" + ], + "out_args": [ + "NhwcConv_13_out-/decoder/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_13" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_12", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_13_out-/decoder/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_13" + ], + "const_args": [ + "GroupNorm_12_wts_7_1_11" + ], + "out_args": [ + "GroupNorm_12.out9_12.out7_1_11" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_11", + "type": "SDSilu", + "in_args": [ + "GroupNorm_12.out9_12.out7_1_11" + ], + "const_args": [ + "Sigmoid_11.weights9_11" + ], + "out_args": [ + "GroupNorm_12_sigmoid_out.9_12.out9_11" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_14-/decoder/up_blocks.1/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_12_sigmoid_out.9_12.out9_11" + ], + "const_args": [ + "NhwcConv_14_weight_NHWC" + ], + "out_args": [ + "NhwcConv_14_out-/decoder/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_14" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.1/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_12_out-/decoder/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_12", + "NhwcConv_14_out-/decoder/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_14" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.1/resnets.0/Add.out_4_1_6" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_13", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.1/resnets.0/Add.out_4_1_6" + ], + "const_args": [ + "GroupNorm_13_wts_7_1_12" + ], + "out_args": [ + "GroupNorm_13.out9_13.out7_1_12" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_12", + "type": "SDSilu", + "in_args": [ + "GroupNorm_13.out9_13.out7_1_12" + ], + "const_args": [ + "Sigmoid_12.weights9_12" + ], + "out_args": [ + "GroupNorm_13_sigmoid_out.9_13.out9_12" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_15-/decoder/up_blocks.1/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_13_sigmoid_out.9_13.out9_12" + ], + "const_args": [ + "NhwcConv_15_weight_NHWC" + ], + "out_args": [ + "NhwcConv_15_out-/decoder/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_15" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_14", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_15_out-/decoder/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_15" + ], + "const_args": [ + "GroupNorm_14_wts_7_1_13" + ], + "out_args": [ + "GroupNorm_14.out9_14.out7_1_13" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_13", + "type": "SDSilu", + "in_args": [ + "GroupNorm_14.out9_14.out7_1_13" + ], + "const_args": [ + "Sigmoid_13.weights9_13" + ], + "out_args": [ + "GroupNorm_14_sigmoid_out.9_14.out9_13" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_16-/decoder/up_blocks.1/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_14_sigmoid_out.9_14.out9_13" + ], + "const_args": [ + "NhwcConv_16_weight_NHWC" + ], + "out_args": [ + "NhwcConv_16_out-/decoder/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_16" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.1/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.1/resnets.0/Add.out_4_1_6", + "NhwcConv_16_out-/decoder/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_16" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.1/resnets.1/Add.out_4_1_7" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_15", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.1/resnets.1/Add.out_4_1_7" + ], + "const_args": [ + "GroupNorm_15_wts_7_1_14" + ], + "out_args": [ + "GroupNorm_15.out9_15.out7_1_14" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_14", + "type": "SDSilu", + "in_args": [ + "GroupNorm_15.out9_15.out7_1_14" + ], + "const_args": [ + "Sigmoid_14.weights9_14" + ], + "out_args": [ + "GroupNorm_15_sigmoid_out.9_15.out9_14" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_17-/decoder/up_blocks.1/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_15_sigmoid_out.9_15.out9_14" + ], + "const_args": [ + "NhwcConv_17_weight_NHWC" + ], + "out_args": [ + "NhwcConv_17_out-/decoder/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_17" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_16", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_17_out-/decoder/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_17" + ], + "const_args": [ + "GroupNorm_16_wts_7_1_15" + ], + "out_args": [ + "GroupNorm_16.out9_16.out7_1_15" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_15", + "type": "SDSilu", + "in_args": [ + "GroupNorm_16.out9_16.out7_1_15" + ], + "const_args": [ + "Sigmoid_15.weights9_15" + ], + "out_args": [ + "GroupNorm_16_sigmoid_out.9_16.out9_15" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_18-/decoder/up_blocks.1/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_16_sigmoid_out.9_16.out9_15" + ], + "const_args": [ + "NhwcConv_18_weight_NHWC" + ], + "out_args": [ + "NhwcConv_18_out-/decoder/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_18" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.1/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.1/resnets.1/Add.out_4_1_7", + "NhwcConv_18_out-/decoder/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_18" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.1/resnets.2/Add.out_4_1_8" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.1/upsamplers.0/Resize", + "type": "SDResize", + "in_args": [ + "/decoder/up_blocks.1/resnets.2/Add.out_4_1_8" + ], + "const_args": [ + "/decoder/up_blocks.1/upsamplers.0/Resize.weights10_1" + ], + "out_args": [ + "/decoder/up_blocks.1/upsamplers.0/Resize_output_0.nhwc2_1.out_10_1" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "128", + "128", + "512" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_19-/decoder/up_blocks.1/upsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/decoder/up_blocks.1/upsamplers.0/Resize_output_0.nhwc2_1.out_10_1" + ], + "const_args": [ + "NhwcConv_19_weight_NHWC" + ], + "out_args": [ + "NhwcConv_19_out-/decoder/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_19" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "512", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_17", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_19_out-/decoder/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_19" + ], + "const_args": [ + "GroupNorm_17_wts_7_1_16" + ], + "out_args": [ + "GroupNorm_17.out9_17.out7_1_16" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "1024" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_20-/decoder/up_blocks.2/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "NhwcConv_19_out-/decoder/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_19" + ], + "const_args": [ + "NhwcConv_20_weight_NHWC" + ], + "out_args": [ + "NhwcConv_20_out-/decoder/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_20" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "1", + "1", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_16", + "type": "SDSilu", + "in_args": [ + "GroupNorm_17.out9_17.out7_1_16" + ], + "const_args": [ + "Sigmoid_16.weights9_16" + ], + "out_args": [ + "GroupNorm_17_sigmoid_out.9_17.out9_16" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_21-/decoder/up_blocks.2/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_17_sigmoid_out.9_17.out9_16" + ], + "const_args": [ + "NhwcConv_21_weight_NHWC" + ], + "out_args": [ + "NhwcConv_21_out-/decoder/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_21" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "512" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "512" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_18", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_21_out-/decoder/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_21" + ], + "const_args": [ + "GroupNorm_18_wts_7_1_17" + ], + "out_args": [ + "GroupNorm_18.out9_18.out7_1_17" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_17", + "type": "SDSilu", + "in_args": [ + "GroupNorm_18.out9_18.out7_1_17" + ], + "const_args": [ + "Sigmoid_17.weights9_17" + ], + "out_args": [ + "GroupNorm_18_sigmoid_out.9_18.out9_17" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_22-/decoder/up_blocks.2/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_18_sigmoid_out.9_18.out9_17" + ], + "const_args": [ + "NhwcConv_22_weight_NHWC" + ], + "out_args": [ + "NhwcConv_22_out-/decoder/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_22" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.2/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_20_out-/decoder/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_20", + "NhwcConv_22_out-/decoder/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_22" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.2/resnets.0/Add.out_4_1_9" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_19", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.2/resnets.0/Add.out_4_1_9" + ], + "const_args": [ + "GroupNorm_19_wts_7_1_18" + ], + "out_args": [ + "GroupNorm_19.out9_19.out7_1_18" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_18", + "type": "SDSilu", + "in_args": [ + "GroupNorm_19.out9_19.out7_1_18" + ], + "const_args": [ + "Sigmoid_18.weights9_18" + ], + "out_args": [ + "GroupNorm_19_sigmoid_out.9_19.out9_18" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_23-/decoder/up_blocks.2/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_19_sigmoid_out.9_19.out9_18" + ], + "const_args": [ + "NhwcConv_23_weight_NHWC" + ], + "out_args": [ + "NhwcConv_23_out-/decoder/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_23" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_20", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_23_out-/decoder/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_23" + ], + "const_args": [ + "GroupNorm_20_wts_7_1_19" + ], + "out_args": [ + "GroupNorm_20.out9_20.out7_1_19" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_19", + "type": "SDSilu", + "in_args": [ + "GroupNorm_20.out9_20.out7_1_19" + ], + "const_args": [ + "Sigmoid_19.weights9_19" + ], + "out_args": [ + "GroupNorm_20_sigmoid_out.9_20.out9_19" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_24-/decoder/up_blocks.2/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_20_sigmoid_out.9_20.out9_19" + ], + "const_args": [ + "NhwcConv_24_weight_NHWC" + ], + "out_args": [ + "NhwcConv_24_out-/decoder/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_24" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.2/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.2/resnets.0/Add.out_4_1_9", + "NhwcConv_24_out-/decoder/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_24" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.2/resnets.1/Add.out_4_1_10" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_21", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.2/resnets.1/Add.out_4_1_10" + ], + "const_args": [ + "GroupNorm_21_wts_7_1_20" + ], + "out_args": [ + "GroupNorm_21.out9_21.out7_1_20" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_20", + "type": "SDSilu", + "in_args": [ + "GroupNorm_21.out9_21.out7_1_20" + ], + "const_args": [ + "Sigmoid_20.weights9_20" + ], + "out_args": [ + "GroupNorm_21_sigmoid_out.9_21.out9_20" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_25-/decoder/up_blocks.2/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_21_sigmoid_out.9_21.out9_20" + ], + "const_args": [ + "NhwcConv_25_weight_NHWC" + ], + "out_args": [ + "NhwcConv_25_out-/decoder/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_25" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_22", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_25_out-/decoder/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_25" + ], + "const_args": [ + "GroupNorm_22_wts_7_1_21" + ], + "out_args": [ + "GroupNorm_22.out9_22.out7_1_21" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_21", + "type": "SDSilu", + "in_args": [ + "GroupNorm_22.out9_22.out7_1_21" + ], + "const_args": [ + "Sigmoid_21.weights9_21" + ], + "out_args": [ + "GroupNorm_22_sigmoid_out.9_22.out9_21" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_26-/decoder/up_blocks.2/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_22_sigmoid_out.9_22.out9_21" + ], + "const_args": [ + "NhwcConv_26_weight_NHWC" + ], + "out_args": [ + "NhwcConv_26_out-/decoder/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_26" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.2/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.2/resnets.1/Add.out_4_1_10", + "NhwcConv_26_out-/decoder/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_26" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.2/resnets.2/Add.out_4_1_11" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.2/upsamplers.0/Resize", + "type": "SDResize", + "in_args": [ + "/decoder/up_blocks.2/resnets.2/Add.out_4_1_11" + ], + "const_args": [ + "/decoder/up_blocks.2/upsamplers.0/Resize.weights10_2" + ], + "out_args": [ + "/decoder/up_blocks.2/upsamplers.0/Resize_output_0.nhwc2_2.out_10_2" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "256", + "256", + "256" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_27-/decoder/up_blocks.2/upsamplers.0/conv/Conv", + "type": "SDConv", + "in_args": [ + "/decoder/up_blocks.2/upsamplers.0/Resize_output_0.nhwc2_2.out_10_2" + ], + "const_args": [ + "NhwcConv_27_weight_NHWC" + ], + "out_args": [ + "NhwcConv_27_out-/decoder/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_27" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "256", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_23", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_27_out-/decoder/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_27" + ], + "const_args": [ + "GroupNorm_23_wts_7_1_22" + ], + "out_args": [ + "GroupNorm_23.out9_23.out7_1_22" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "512" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_28-/decoder/up_blocks.3/resnets.0/conv_shortcut/Conv", + "type": "SDConv", + "in_args": [ + "NhwcConv_27_out-/decoder/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_27" + ], + "const_args": [ + "NhwcConv_28_weight_NHWC" + ], + "out_args": [ + "NhwcConv_28_out-/decoder/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_28" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "pads": { + "type": "int", + "value": [ + "0", + "0", + "0", + "0" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "1", + "1", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_22", + "type": "SDSilu", + "in_args": [ + "GroupNorm_23.out9_23.out7_1_22" + ], + "const_args": [ + "Sigmoid_22.weights9_22" + ], + "out_args": [ + "GroupNorm_23_sigmoid_out.9_23.out9_22" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_29-/decoder/up_blocks.3/resnets.0/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_23_sigmoid_out.9_23.out9_22" + ], + "const_args": [ + "NhwcConv_29_weight_NHWC" + ], + "out_args": [ + "NhwcConv_29_out-/decoder/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_29" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "256" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "3", + "3", + "256" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_24", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_29_out-/decoder/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_29" + ], + "const_args": [ + "GroupNorm_24_wts_7_1_23" + ], + "out_args": [ + "GroupNorm_24.out9_24.out7_1_23" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_23", + "type": "SDSilu", + "in_args": [ + "GroupNorm_24.out9_24.out7_1_23" + ], + "const_args": [ + "Sigmoid_23.weights9_23" + ], + "out_args": [ + "GroupNorm_24_sigmoid_out.9_24.out9_23" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_30-/decoder/up_blocks.3/resnets.0/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_24_sigmoid_out.9_24.out9_23" + ], + "const_args": [ + "NhwcConv_30_weight_NHWC" + ], + "out_args": [ + "NhwcConv_30_out-/decoder/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_30" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "3", + "3", + "128" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.3/resnets.0/Add", + "type": "SDAdd", + "in_args": [ + "NhwcConv_28_out-/decoder/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_28", + "NhwcConv_30_out-/decoder/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_30" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.3/resnets.0/Add.out_4_1_12" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_25", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.3/resnets.0/Add.out_4_1_12" + ], + "const_args": [ + "GroupNorm_25_wts_7_1_24" + ], + "out_args": [ + "GroupNorm_25.out9_25.out7_1_24" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_24", + "type": "SDSilu", + "in_args": [ + "GroupNorm_25.out9_25.out7_1_24" + ], + "const_args": [ + "Sigmoid_24.weights9_24" + ], + "out_args": [ + "GroupNorm_25_sigmoid_out.9_25.out9_24" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_31-/decoder/up_blocks.3/resnets.1/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_25_sigmoid_out.9_25.out9_24" + ], + "const_args": [ + "NhwcConv_31_weight_NHWC" + ], + "out_args": [ + "NhwcConv_31_out-/decoder/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_31" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "3", + "3", + "128" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_26", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_31_out-/decoder/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_31" + ], + "const_args": [ + "GroupNorm_26_wts_7_1_25" + ], + "out_args": [ + "GroupNorm_26.out9_26.out7_1_25" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_25", + "type": "SDSilu", + "in_args": [ + "GroupNorm_26.out9_26.out7_1_25" + ], + "const_args": [ + "Sigmoid_25.weights9_25" + ], + "out_args": [ + "GroupNorm_26_sigmoid_out.9_26.out9_25" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_32-/decoder/up_blocks.3/resnets.1/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_26_sigmoid_out.9_26.out9_25" + ], + "const_args": [ + "NhwcConv_32_weight_NHWC" + ], + "out_args": [ + "NhwcConv_32_out-/decoder/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_32" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "3", + "3", + "128" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.3/resnets.1/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.3/resnets.0/Add.out_4_1_12", + "NhwcConv_32_out-/decoder/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_32" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.3/resnets.1/Add.out_4_1_13" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_27", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.3/resnets.1/Add.out_4_1_13" + ], + "const_args": [ + "GroupNorm_27_wts_7_1_26" + ], + "out_args": [ + "GroupNorm_27.out9_27.out7_1_26" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_26", + "type": "SDSilu", + "in_args": [ + "GroupNorm_27.out9_27.out7_1_26" + ], + "const_args": [ + "Sigmoid_26.weights9_26" + ], + "out_args": [ + "GroupNorm_27_sigmoid_out.9_27.out9_26" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_33-/decoder/up_blocks.3/resnets.2/conv1/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_27_sigmoid_out.9_27.out9_26" + ], + "const_args": [ + "NhwcConv_33_weight_NHWC" + ], + "out_args": [ + "NhwcConv_33_out-/decoder/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_33" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "3", + "3", + "128" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_28", + "type": "SDGroupNorm", + "in_args": [ + "NhwcConv_33_out-/decoder/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_33" + ], + "const_args": [ + "GroupNorm_28_wts_7_1_27" + ], + "out_args": [ + "GroupNorm_28.out9_28.out7_1_27" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_27", + "type": "SDSilu", + "in_args": [ + "GroupNorm_28.out9_28.out7_1_27" + ], + "const_args": [ + "Sigmoid_27.weights9_27" + ], + "out_args": [ + "GroupNorm_28_sigmoid_out.9_28.out9_27" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_34-/decoder/up_blocks.3/resnets.2/conv2/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_28_sigmoid_out.9_28.out9_27" + ], + "const_args": [ + "NhwcConv_34_weight_NHWC" + ], + "out_args": [ + "NhwcConv_34_out-/decoder/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_34" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128", + "3", + "3", + "128" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "/decoder/up_blocks.3/resnets.2/Add", + "type": "SDAdd", + "in_args": [ + "/decoder/up_blocks.3/resnets.1/Add.out_4_1_13", + "NhwcConv_34_out-/decoder/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_34" + ], + "const_args": [], + "out_args": [ + "/decoder/up_blocks.3/resnets.2/Add.out_4_1_14" + ], + "attrs": { + "a_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "b_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "c_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "is_bias_add": { + "type": "int", + "value": [ + "0" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "GroupNorm_29", + "type": "SDGroupNorm", + "in_args": [ + "/decoder/up_blocks.3/resnets.2/Add.out_4_1_14" + ], + "const_args": [ + "GroupNorm_29_wts_7_1_28" + ], + "out_args": [ + "GroupNorm_29.out9_29.out7_1_28" + ], + "attrs": { + "epsilon": { + "type": "float", + "value": [ + "9.999999974752427e-07" + ] + }, + "groups": { + "type": "int", + "value": [ + "32" + ] + }, + "channels_last": { + "type": "int", + "value": [ + "1" + ] + }, + "activation": { + "type": "int", + "value": [ + "0" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "wts_shape": { + "type": "int", + "value": [ + "256" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "Sigmoid_28", + "type": "SDSilu", + "in_args": [ + "GroupNorm_29.out9_29.out7_1_28" + ], + "const_args": [ + "Sigmoid_28.weights9_28" + ], + "out_args": [ + "GroupNorm_29_sigmoid_out.9_29.out9_28" + ], + "attrs": { + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "128" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + }, + { + "name": "NhwcConv_35-/decoder/conv_out/Conv", + "type": "SDConv", + "in_args": [ + "GroupNorm_29_sigmoid_out.9_29.out9_28" + ], + "const_args": [ + "NhwcConv_35_weight_NHWC" + ], + "out_args": [ + "NhwcConv_35_out-sample.out0_1_35" + ], + "attrs": { + "auto_pad": { + "type": "str", + "value": [ + "NOTSET" + ] + }, + "dilations": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "group": { + "type": "int", + "value": [ + "1" + ] + }, + "kernel_shape": { + "type": "int", + "value": [ + "3", + "3" + ] + }, + "pads": { + "type": "int", + "value": [ + "1", + "1", + "1", + "1" + ] + }, + "strides": { + "type": "int", + "value": [ + "1", + "1" + ] + }, + "input_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "128" + ] + }, + "output_shape": { + "type": "int", + "value": [ + "1", + "512", + "512", + "3" + ] + }, + "weight_shape": { + "type": "int", + "value": [ + "3", + "3", + "3", + "128" + ] + }, + "out_dtypes": { + "type": "str", + "value": [ + "bfloat16" + ] + }, + "in_dtypes": { + "type": "str", + "value": [ + "bfloat16", + "bfp16ebs8", + "float", + "bfloat16" + ] + }, + "ctrl_packet": { + "type": "int", + "value": [ + "1" + ] + } + } + } + ], + "fused_tensors": { + "in": { + "buffer_size": 32768, + "xrt_arg_id": 0, + "packed_tensors": [ + "Transpose_0_out-latents.out0_1_0" + ] + }, + "out": { + "buffer_size": 1572864, + "xrt_arg_id": 1, + "packed_tensors": [ + "NhwcConv_35_out-sample.out0_1_35" + ] + }, + "scratch": { + "buffer_size": 3519053824, + "xrt_arg_id": 2, + "packed_tensors": [ + "NhwcConv_0_out-/post_quant_conv/Conv_output_0.out0_1_0", + "NhwcConv_1_out-/decoder/conv_in/Conv_output_0.out0_1_1", + "GroupNorm_0.out9_0.out7_1_0", + "GroupNorm_0_sigmoid_out.9_0.out9_0", + "NhwcConv_2_out-/decoder/mid_block/resnets.0/conv1/Conv_output_0.out0_1_2", + "GroupNorm_1.out9_1.out7_1_1", + "GroupNorm_1_sigmoid_out.9_1.out9_1", + "NhwcConv_3_out-/decoder/mid_block/resnets.0/conv2/Conv_output_0.out0_1_3", + "/decoder/mid_block/resnets.0/Add.out_4_1_0", + "/decoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out7_0_0", + "/decoder/mid_block/attentions.0/to_k/Add_output_0.out2_3_0", + "/decoder/mid_block/attentions.0/to_q/Add_output_0.out2_3_1", + "/decoder/mid_block/attentions.0/to_v/Add_output_0.out2_3_2", + "/decoder/mid_block/attentions.0/Reshape_4_output_0.out13_0", + "/decoder/mid_block/attentions.0/Reshape_5_output_0.nhwc3_0.out2_0_0", + "/decoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_1", + "GroupNorm_3.out9_3.out7_1_2", + "GroupNorm_3_sigmoid_out.9_3.out9_2", + "NhwcConv_4_out-/decoder/mid_block/resnets.1/conv1/Conv_output_0.out0_1_4", + "GroupNorm_4.out9_4.out7_1_3", + "GroupNorm_4_sigmoid_out.9_4.out9_3", + "NhwcConv_5_out-/decoder/mid_block/resnets.1/conv2/Conv_output_0.out0_1_5", + "/decoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_2", + "GroupNorm_5.out9_5.out7_1_4", + "GroupNorm_5_sigmoid_out.9_5.out9_4", + "NhwcConv_6_out-/decoder/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_6", + "GroupNorm_6.out9_6.out7_1_5", + "GroupNorm_6_sigmoid_out.9_6.out9_5", + "NhwcConv_7_out-/decoder/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_7", + "/decoder/up_blocks.0/resnets.0/Add_output_0_NHWC.out_4_1_3", + "GroupNorm_7.out9_7.out7_1_6", + "GroupNorm_7_sigmoid_out.9_7.out9_6", + "NhwcConv_8_out-/decoder/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_8", + "GroupNorm_8.out9_8.out7_1_7", + "GroupNorm_8_sigmoid_out.9_8.out9_7", + "NhwcConv_9_out-/decoder/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_9", + "/decoder/up_blocks.0/resnets.1/Add_output_0_NHWC.out_4_1_4", + "GroupNorm_9.out9_9.out7_1_8", + "GroupNorm_9_sigmoid_out.9_9.out9_8", + "NhwcConv_10_out-/decoder/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_10", + "GroupNorm_10.out9_10.out7_1_9", + "GroupNorm_10_sigmoid_out.9_10.out9_9", + "NhwcConv_11_out-/decoder/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_11", + "/decoder/up_blocks.0/resnets.2/Add_output_0.nhwc2_0.out_4_1_5", + "/decoder/up_blocks.0/upsamplers.0/Resize_output_0.nhwc2_0.out_10_0", + "NhwcConv_12_out-/decoder/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_12", + "GroupNorm_11.out9_11.out7_1_10", + "GroupNorm_11_sigmoid_out.9_11.out9_10", + "NhwcConv_13_out-/decoder/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_13", + "GroupNorm_12.out9_12.out7_1_11", + "GroupNorm_12_sigmoid_out.9_12.out9_11", + "NhwcConv_14_out-/decoder/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_14", + "/decoder/up_blocks.1/resnets.0/Add.out_4_1_6", + "GroupNorm_13.out9_13.out7_1_12", + "GroupNorm_13_sigmoid_out.9_13.out9_12", + "NhwcConv_15_out-/decoder/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_15", + "GroupNorm_14.out9_14.out7_1_13", + "GroupNorm_14_sigmoid_out.9_14.out9_13", + "NhwcConv_16_out-/decoder/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_16", + "/decoder/up_blocks.1/resnets.1/Add.out_4_1_7", + "GroupNorm_15.out9_15.out7_1_14", + "GroupNorm_15_sigmoid_out.9_15.out9_14", + "NhwcConv_17_out-/decoder/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_17", + "GroupNorm_16.out9_16.out7_1_15", + "GroupNorm_16_sigmoid_out.9_16.out9_15", + "NhwcConv_18_out-/decoder/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_18", + "/decoder/up_blocks.1/resnets.2/Add.out_4_1_8", + "/decoder/up_blocks.1/upsamplers.0/Resize_output_0.nhwc2_1.out_10_1", + "NhwcConv_19_out-/decoder/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_19", + "GroupNorm_17.out9_17.out7_1_16", + "NhwcConv_20_out-/decoder/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_20", + "GroupNorm_17_sigmoid_out.9_17.out9_16", + "NhwcConv_21_out-/decoder/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_21", + "GroupNorm_18.out9_18.out7_1_17", + "GroupNorm_18_sigmoid_out.9_18.out9_17", + "NhwcConv_22_out-/decoder/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_22", + "/decoder/up_blocks.2/resnets.0/Add.out_4_1_9", + "GroupNorm_19.out9_19.out7_1_18", + "GroupNorm_19_sigmoid_out.9_19.out9_18", + "NhwcConv_23_out-/decoder/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_23", + "GroupNorm_20.out9_20.out7_1_19", + "GroupNorm_20_sigmoid_out.9_20.out9_19", + "NhwcConv_24_out-/decoder/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_24", + "/decoder/up_blocks.2/resnets.1/Add.out_4_1_10", + "GroupNorm_21.out9_21.out7_1_20", + "GroupNorm_21_sigmoid_out.9_21.out9_20", + "NhwcConv_25_out-/decoder/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_25", + "GroupNorm_22.out9_22.out7_1_21", + "GroupNorm_22_sigmoid_out.9_22.out9_21", + "NhwcConv_26_out-/decoder/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_26", + "/decoder/up_blocks.2/resnets.2/Add.out_4_1_11", + "/decoder/up_blocks.2/upsamplers.0/Resize_output_0.nhwc2_2.out_10_2", + "NhwcConv_27_out-/decoder/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_27", + "GroupNorm_23.out9_23.out7_1_22", + "NhwcConv_28_out-/decoder/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_28", + "GroupNorm_23_sigmoid_out.9_23.out9_22", + "NhwcConv_29_out-/decoder/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_29", + "GroupNorm_24.out9_24.out7_1_23", + "GroupNorm_24_sigmoid_out.9_24.out9_23", + "NhwcConv_30_out-/decoder/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_30", + "/decoder/up_blocks.3/resnets.0/Add.out_4_1_12", + "GroupNorm_25.out9_25.out7_1_24", + "GroupNorm_25_sigmoid_out.9_25.out9_24", + "NhwcConv_31_out-/decoder/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_31", + "GroupNorm_26.out9_26.out7_1_25", + "GroupNorm_26_sigmoid_out.9_26.out9_25", + "NhwcConv_32_out-/decoder/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_32", + "/decoder/up_blocks.3/resnets.1/Add.out_4_1_13", + "GroupNorm_27.out9_27.out7_1_26", + "GroupNorm_27_sigmoid_out.9_27.out9_26", + "NhwcConv_33_out-/decoder/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_33", + "GroupNorm_28.out9_28.out7_1_27", + "GroupNorm_28_sigmoid_out.9_28.out9_27", + "NhwcConv_34_out-/decoder/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_34", + "/decoder/up_blocks.3/resnets.2/Add.out_4_1_14", + "GroupNorm_29.out9_29.out7_1_28", + "GroupNorm_29_sigmoid_out.9_29.out9_28" + ] + }, + "const": { + "buffer_size": 58459280, + "xrt_arg_id": 3, + "packed_tensors": [ + "NhwcConv_0_weight_NHWC", + "NhwcConv_1_weight_NHWC", + "GroupNorm_0_wts_7_1_0", + "Sigmoid_0.weights9_0", + "NhwcConv_2_weight_NHWC", + "GroupNorm_1_wts_7_1_1", + "Sigmoid_1.weights9_1", + "NhwcConv_3_weight_NHWC", + "GroupNorm_2_wts_7_0_0", + "onnx::MatMul_918", + "onnx::MatMul_917", + "onnx::MatMul_919", + "/decoder/mid_block/attentions.0/MatMulmha_1_0_mask.13_0", + "onnx::MatMul_927", + "GroupNorm_3_wts_7_1_2", + "Sigmoid_2.weights9_2", + "NhwcConv_4_weight_NHWC", + "GroupNorm_4_wts_7_1_3", + "Sigmoid_3.weights9_3", + "NhwcConv_5_weight_NHWC", + "GroupNorm_5_wts_7_1_4", + "Sigmoid_4.weights9_4", + "NhwcConv_6_weight_NHWC", + "GroupNorm_6_wts_7_1_5", + "Sigmoid_5.weights9_5", + "NhwcConv_7_weight_NHWC", + "GroupNorm_7_wts_7_1_6", + "Sigmoid_6.weights9_6", + "NhwcConv_8_weight_NHWC", + "GroupNorm_8_wts_7_1_7", + "Sigmoid_7.weights9_7", + "NhwcConv_9_weight_NHWC", + "GroupNorm_9_wts_7_1_8", + "Sigmoid_8.weights9_8", + "NhwcConv_10_weight_NHWC", + "GroupNorm_10_wts_7_1_9", + "Sigmoid_9.weights9_9", + "NhwcConv_11_weight_NHWC", + "/decoder/up_blocks.0/upsamplers.0/Resize.weights10_0", + "NhwcConv_12_weight_NHWC", + "GroupNorm_11_wts_7_1_10", + "Sigmoid_10.weights9_10", + "NhwcConv_13_weight_NHWC", + "GroupNorm_12_wts_7_1_11", + "Sigmoid_11.weights9_11", + "NhwcConv_14_weight_NHWC", + "GroupNorm_13_wts_7_1_12", + "Sigmoid_12.weights9_12", + "NhwcConv_15_weight_NHWC", + "GroupNorm_14_wts_7_1_13", + "Sigmoid_13.weights9_13", + "NhwcConv_16_weight_NHWC", + "GroupNorm_15_wts_7_1_14", + "Sigmoid_14.weights9_14", + "NhwcConv_17_weight_NHWC", + "GroupNorm_16_wts_7_1_15", + "Sigmoid_15.weights9_15", + "NhwcConv_18_weight_NHWC", + "/decoder/up_blocks.1/upsamplers.0/Resize.weights10_1", + "NhwcConv_19_weight_NHWC", + "GroupNorm_17_wts_7_1_16", + "NhwcConv_20_weight_NHWC", + "Sigmoid_16.weights9_16", + "NhwcConv_21_weight_NHWC", + "GroupNorm_18_wts_7_1_17", + "Sigmoid_17.weights9_17", + "NhwcConv_22_weight_NHWC", + "GroupNorm_19_wts_7_1_18", + "Sigmoid_18.weights9_18", + "NhwcConv_23_weight_NHWC", + "GroupNorm_20_wts_7_1_19", + "Sigmoid_19.weights9_19", + "NhwcConv_24_weight_NHWC", + "GroupNorm_21_wts_7_1_20", + "Sigmoid_20.weights9_20", + "NhwcConv_25_weight_NHWC", + "GroupNorm_22_wts_7_1_21", + "Sigmoid_21.weights9_21", + "NhwcConv_26_weight_NHWC", + "/decoder/up_blocks.2/upsamplers.0/Resize.weights10_2", + "NhwcConv_27_weight_NHWC", + "GroupNorm_23_wts_7_1_22", + "NhwcConv_28_weight_NHWC", + "Sigmoid_22.weights9_22", + "NhwcConv_29_weight_NHWC", + "GroupNorm_24_wts_7_1_23", + "Sigmoid_23.weights9_23", + "NhwcConv_30_weight_NHWC", + "GroupNorm_25_wts_7_1_24", + "Sigmoid_24.weights9_24", + "NhwcConv_31_weight_NHWC", + "GroupNorm_26_wts_7_1_25", + "Sigmoid_25.weights9_25", + "NhwcConv_32_weight_NHWC", + "GroupNorm_27_wts_7_1_26", + "Sigmoid_26.weights9_26", + "NhwcConv_33_weight_NHWC", + "GroupNorm_28_wts_7_1_27", + "Sigmoid_27.weights9_27", + "NhwcConv_34_weight_NHWC", + "GroupNorm_29_wts_7_1_28", + "Sigmoid_28.weights9_28", + "NhwcConv_35_weight_NHWC" + ] + }, + "super_instr": { + "buffer_size": 0, + "xrt_arg_id": 4, + "packed_tensors": [] + } + }, + "tensor_map": { + "Transpose_0_out-latents.out0_1_0": { + "packed_buffer_label": "in", + "xrt_arg_id": 0, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 4 + ], + "size_in_bytes": 32768, + "offset": 0 + }, + "NhwcConv_35_out-sample.out0_1_35": { + "packed_buffer_label": "out", + "xrt_arg_id": 1, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 3 + ], + "size_in_bytes": 1572864, + "offset": 0 + }, + "NhwcConv_0_out-/post_quant_conv/Conv_output_0.out0_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 4 + ], + "size_in_bytes": 32768, + "offset": 0 + }, + "NhwcConv_1_out-/decoder/conv_in/Conv_output_0.out0_1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 32768 + }, + "GroupNorm_0.out9_0.out7_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 4227072 + }, + "GroupNorm_0_sigmoid_out.9_0.out9_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 8421376 + }, + "NhwcConv_2_out-/decoder/mid_block/resnets.0/conv1/Conv_output_0.out0_1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 12615680 + }, + "GroupNorm_1.out9_1.out7_1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 16809984 + }, + "GroupNorm_1_sigmoid_out.9_1.out9_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 21004288 + }, + "NhwcConv_3_out-/decoder/mid_block/resnets.0/conv2/Conv_output_0.out0_1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 25198592 + }, + "/decoder/mid_block/resnets.0/Add.out_4_1_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 29392896 + }, + "/decoder/mid_block/attentions.0/group_norm/Add_output_0_4d_NHWC.out7_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 4096, + 512 + ], + "size_in_bytes": 4194304, + "offset": 33587200 + }, + "/decoder/mid_block/attentions.0/to_k/Add_output_0.out2_3_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 4096, + 512 + ], + "size_in_bytes": 4194304, + "offset": 37781504 + }, + "/decoder/mid_block/attentions.0/to_q/Add_output_0.out2_3_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 4096, + 512 + ], + "size_in_bytes": 4194304, + "offset": 41975808 + }, + "/decoder/mid_block/attentions.0/to_v/Add_output_0.out2_3_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 4096, + 512 + ], + "size_in_bytes": 4194304, + "offset": 46170112 + }, + "/decoder/mid_block/attentions.0/Reshape_4_output_0.out13_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 4096, + 512 + ], + "size_in_bytes": 4194304, + "offset": 50364416 + }, + "/decoder/mid_block/attentions.0/Reshape_5_output_0.nhwc3_0.out2_0_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 54558720 + }, + "/decoder/mid_block/attentions.0/Add_output_0_NHWC.out_4_1_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 58753024 + }, + "GroupNorm_3.out9_3.out7_1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 62947328 + }, + "GroupNorm_3_sigmoid_out.9_3.out9_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 67141632 + }, + "NhwcConv_4_out-/decoder/mid_block/resnets.1/conv1/Conv_output_0.out0_1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 71335936 + }, + "GroupNorm_4.out9_4.out7_1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 75530240 + }, + "GroupNorm_4_sigmoid_out.9_4.out9_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 79724544 + }, + "NhwcConv_5_out-/decoder/mid_block/resnets.1/conv2/Conv_output_0.out0_1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 83918848 + }, + "/decoder/mid_block/resnets.1/Add_output_0_NHWC.out_4_1_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 88113152 + }, + "GroupNorm_5.out9_5.out7_1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 92307456 + }, + "GroupNorm_5_sigmoid_out.9_5.out9_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 96501760 + }, + "NhwcConv_6_out-/decoder/up_blocks.0/resnets.0/conv1/Conv_output_0.out0_1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 100696064 + }, + "GroupNorm_6.out9_6.out7_1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 104890368 + }, + "GroupNorm_6_sigmoid_out.9_6.out9_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 109084672 + }, + "NhwcConv_7_out-/decoder/up_blocks.0/resnets.0/conv2/Conv_output_0.out0_1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 113278976 + }, + "/decoder/up_blocks.0/resnets.0/Add_output_0_NHWC.out_4_1_3": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 117473280 + }, + "GroupNorm_7.out9_7.out7_1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 121667584 + }, + "GroupNorm_7_sigmoid_out.9_7.out9_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 125861888 + }, + "NhwcConv_8_out-/decoder/up_blocks.0/resnets.1/conv1/Conv_output_0.out0_1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 130056192 + }, + "GroupNorm_8.out9_8.out7_1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 134250496 + }, + "GroupNorm_8_sigmoid_out.9_8.out9_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 138444800 + }, + "NhwcConv_9_out-/decoder/up_blocks.0/resnets.1/conv2/Conv_output_0.out0_1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 142639104 + }, + "/decoder/up_blocks.0/resnets.1/Add_output_0_NHWC.out_4_1_4": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 146833408 + }, + "GroupNorm_9.out9_9.out7_1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 151027712 + }, + "GroupNorm_9_sigmoid_out.9_9.out9_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 155222016 + }, + "NhwcConv_10_out-/decoder/up_blocks.0/resnets.2/conv1/Conv_output_0.out0_1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 159416320 + }, + "GroupNorm_10.out9_10.out7_1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 163610624 + }, + "GroupNorm_10_sigmoid_out.9_10.out9_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 167804928 + }, + "NhwcConv_11_out-/decoder/up_blocks.0/resnets.2/conv2/Conv_output_0.out0_1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 171999232 + }, + "/decoder/up_blocks.0/resnets.2/Add_output_0.nhwc2_0.out_4_1_5": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 64, + 64, + 512 + ], + "size_in_bytes": 4194304, + "offset": 176193536 + }, + "/decoder/up_blocks.0/upsamplers.0/Resize_output_0.nhwc2_0.out_10_0": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 180387840 + }, + "NhwcConv_12_out-/decoder/up_blocks.0/upsamplers.0/conv/Conv_output_0.out0_1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 197165056 + }, + "GroupNorm_11.out9_11.out7_1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 213942272 + }, + "GroupNorm_11_sigmoid_out.9_11.out9_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 230719488 + }, + "NhwcConv_13_out-/decoder/up_blocks.1/resnets.0/conv1/Conv_output_0.out0_1_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 247496704 + }, + "GroupNorm_12.out9_12.out7_1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 264273920 + }, + "GroupNorm_12_sigmoid_out.9_12.out9_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 281051136 + }, + "NhwcConv_14_out-/decoder/up_blocks.1/resnets.0/conv2/Conv_output_0.out0_1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 297828352 + }, + "/decoder/up_blocks.1/resnets.0/Add.out_4_1_6": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 314605568 + }, + "GroupNorm_13.out9_13.out7_1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 331382784 + }, + "GroupNorm_13_sigmoid_out.9_13.out9_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 348160000 + }, + "NhwcConv_15_out-/decoder/up_blocks.1/resnets.1/conv1/Conv_output_0.out0_1_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 364937216 + }, + "GroupNorm_14.out9_14.out7_1_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 381714432 + }, + "GroupNorm_14_sigmoid_out.9_14.out9_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 398491648 + }, + "NhwcConv_16_out-/decoder/up_blocks.1/resnets.1/conv2/Conv_output_0.out0_1_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 415268864 + }, + "/decoder/up_blocks.1/resnets.1/Add.out_4_1_7": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 432046080 + }, + "GroupNorm_15.out9_15.out7_1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 448823296 + }, + "GroupNorm_15_sigmoid_out.9_15.out9_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 465600512 + }, + "NhwcConv_17_out-/decoder/up_blocks.1/resnets.2/conv1/Conv_output_0.out0_1_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 482377728 + }, + "GroupNorm_16.out9_16.out7_1_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 499154944 + }, + "GroupNorm_16_sigmoid_out.9_16.out9_15": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 515932160 + }, + "NhwcConv_18_out-/decoder/up_blocks.1/resnets.2/conv2/Conv_output_0.out0_1_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 532709376 + }, + "/decoder/up_blocks.1/resnets.2/Add.out_4_1_8": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 128, + 128, + 512 + ], + "size_in_bytes": 16777216, + "offset": 549486592 + }, + "/decoder/up_blocks.1/upsamplers.0/Resize_output_0.nhwc2_1.out_10_1": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 512 + ], + "size_in_bytes": 67108864, + "offset": 566263808 + }, + "NhwcConv_19_out-/decoder/up_blocks.1/upsamplers.0/conv/Conv_output_0.out0_1_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 512 + ], + "size_in_bytes": 67108864, + "offset": 633372672 + }, + "GroupNorm_17.out9_17.out7_1_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 512 + ], + "size_in_bytes": 67108864, + "offset": 700481536 + }, + "NhwcConv_20_out-/decoder/up_blocks.2/resnets.0/conv_shortcut/Conv_output_0.out0_1_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 767590400 + }, + "GroupNorm_17_sigmoid_out.9_17.out9_16": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 512 + ], + "size_in_bytes": 67108864, + "offset": 801144832 + }, + "NhwcConv_21_out-/decoder/up_blocks.2/resnets.0/conv1/Conv_output_0.out0_1_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 868253696 + }, + "GroupNorm_18.out9_18.out7_1_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 901808128 + }, + "GroupNorm_18_sigmoid_out.9_18.out9_17": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 935362560 + }, + "NhwcConv_22_out-/decoder/up_blocks.2/resnets.0/conv2/Conv_output_0.out0_1_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 968916992 + }, + "/decoder/up_blocks.2/resnets.0/Add.out_4_1_9": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1002471424 + }, + "GroupNorm_19.out9_19.out7_1_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1036025856 + }, + "GroupNorm_19_sigmoid_out.9_19.out9_18": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1069580288 + }, + "NhwcConv_23_out-/decoder/up_blocks.2/resnets.1/conv1/Conv_output_0.out0_1_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1103134720 + }, + "GroupNorm_20.out9_20.out7_1_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1136689152 + }, + "GroupNorm_20_sigmoid_out.9_20.out9_19": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1170243584 + }, + "NhwcConv_24_out-/decoder/up_blocks.2/resnets.1/conv2/Conv_output_0.out0_1_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1203798016 + }, + "/decoder/up_blocks.2/resnets.1/Add.out_4_1_10": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1237352448 + }, + "GroupNorm_21.out9_21.out7_1_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1270906880 + }, + "GroupNorm_21_sigmoid_out.9_21.out9_20": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1304461312 + }, + "NhwcConv_25_out-/decoder/up_blocks.2/resnets.2/conv1/Conv_output_0.out0_1_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1338015744 + }, + "GroupNorm_22.out9_22.out7_1_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1371570176 + }, + "GroupNorm_22_sigmoid_out.9_22.out9_21": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1405124608 + }, + "NhwcConv_26_out-/decoder/up_blocks.2/resnets.2/conv2/Conv_output_0.out0_1_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1438679040 + }, + "/decoder/up_blocks.2/resnets.2/Add.out_4_1_11": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 256, + 256, + 256 + ], + "size_in_bytes": 33554432, + "offset": 1472233472 + }, + "/decoder/up_blocks.2/upsamplers.0/Resize_output_0.nhwc2_2.out_10_2": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 256 + ], + "size_in_bytes": 134217728, + "offset": 1505787904 + }, + "NhwcConv_27_out-/decoder/up_blocks.2/upsamplers.0/conv/Conv_output_0.out0_1_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 256 + ], + "size_in_bytes": 134217728, + "offset": 1640005632 + }, + "GroupNorm_23.out9_23.out7_1_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 256 + ], + "size_in_bytes": 134217728, + "offset": 1774223360 + }, + "NhwcConv_28_out-/decoder/up_blocks.3/resnets.0/conv_shortcut/Conv_output_0.out0_1_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 1908441088 + }, + "GroupNorm_23_sigmoid_out.9_23.out9_22": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 256 + ], + "size_in_bytes": 134217728, + "offset": 1975549952 + }, + "NhwcConv_29_out-/decoder/up_blocks.3/resnets.0/conv1/Conv_output_0.out0_1_29": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2109767680 + }, + "GroupNorm_24.out9_24.out7_1_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2176876544 + }, + "GroupNorm_24_sigmoid_out.9_24.out9_23": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2243985408 + }, + "NhwcConv_30_out-/decoder/up_blocks.3/resnets.0/conv2/Conv_output_0.out0_1_30": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2311094272 + }, + "/decoder/up_blocks.3/resnets.0/Add.out_4_1_12": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2378203136 + }, + "GroupNorm_25.out9_25.out7_1_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2445312000 + }, + "GroupNorm_25_sigmoid_out.9_25.out9_24": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2512420864 + }, + "NhwcConv_31_out-/decoder/up_blocks.3/resnets.1/conv1/Conv_output_0.out0_1_31": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2579529728 + }, + "GroupNorm_26.out9_26.out7_1_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2646638592 + }, + "GroupNorm_26_sigmoid_out.9_26.out9_25": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2713747456 + }, + "NhwcConv_32_out-/decoder/up_blocks.3/resnets.1/conv2/Conv_output_0.out0_1_32": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2780856320 + }, + "/decoder/up_blocks.3/resnets.1/Add.out_4_1_13": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2847965184 + }, + "GroupNorm_27.out9_27.out7_1_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2915074048 + }, + "GroupNorm_27_sigmoid_out.9_27.out9_26": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 2982182912 + }, + "NhwcConv_33_out-/decoder/up_blocks.3/resnets.2/conv1/Conv_output_0.out0_1_33": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3049291776 + }, + "GroupNorm_28.out9_28.out7_1_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3116400640 + }, + "GroupNorm_28_sigmoid_out.9_28.out9_27": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3183509504 + }, + "NhwcConv_34_out-/decoder/up_blocks.3/resnets.2/conv2/Conv_output_0.out0_1_34": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3250618368 + }, + "/decoder/up_blocks.3/resnets.2/Add.out_4_1_14": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3317727232 + }, + "GroupNorm_29.out9_29.out7_1_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3384836096 + }, + "GroupNorm_29_sigmoid_out.9_29.out9_28": { + "packed_buffer_label": "scratch", + "xrt_arg_id": 2, + "dtype": "bfloat16", + "shape": [ + 1, + 512, + 512, + 128 + ], + "size_in_bytes": 67108864, + "offset": 3451944960 + }, + "NhwcConv_0_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 400 + ], + "size_in_bytes": 400, + "offset": 0, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_0.const", + "file_size": 400 + }, + "NhwcConv_1_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 49664 + ], + "size_in_bytes": 49664, + "offset": 400, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_1.const", + "file_size": 49664 + }, + "GroupNorm_0_wts_7_1_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 50064, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_2.const", + "file_size": 2048 + }, + "Sigmoid_0.weights9_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 52112, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_3.const", + "file_size": 256 + }, + "NhwcConv_2_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 52368, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_4.const", + "file_size": 2785280 + }, + "GroupNorm_1_wts_7_1_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 2837648, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_5.const", + "file_size": 2048 + }, + "Sigmoid_1.weights9_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 2839696, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_6.const", + "file_size": 256 + }, + "NhwcConv_3_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 2839952, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_7.const", + "file_size": 2785280 + }, + "GroupNorm_2_wts_7_0_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 5625232, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_8.const", + "file_size": 2048 + }, + "onnx::MatMul_918": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 299008 + ], + "size_in_bytes": 299008, + "offset": 5627280, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_9.const", + "file_size": 299008 + }, + "onnx::MatMul_917": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 299008 + ], + "size_in_bytes": 299008, + "offset": 5926288, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_10.const", + "file_size": 299008 + }, + "onnx::MatMul_919": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 299008 + ], + "size_in_bytes": 299008, + "offset": 6225296, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_11.const", + "file_size": 299008 + }, + "/decoder/mid_block/attentions.0/MatMulmha_1_0_mask.13_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 4096 + ], + "size_in_bytes": 8192, + "offset": 6524304, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_12.const", + "file_size": 8192 + }, + "onnx::MatMul_927": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 299008 + ], + "size_in_bytes": 299008, + "offset": 6532496, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_13.const", + "file_size": 299008 + }, + "GroupNorm_3_wts_7_1_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 6831504, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_14.const", + "file_size": 2048 + }, + "Sigmoid_2.weights9_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 6833552, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_15.const", + "file_size": 256 + }, + "NhwcConv_4_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 6833808, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_16.const", + "file_size": 2785280 + }, + "GroupNorm_4_wts_7_1_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 9619088, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_17.const", + "file_size": 2048 + }, + "Sigmoid_3.weights9_3": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 9621136, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_18.const", + "file_size": 256 + }, + "NhwcConv_5_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 9621392, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_19.const", + "file_size": 2785280 + }, + "GroupNorm_5_wts_7_1_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 12406672, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_20.const", + "file_size": 2048 + }, + "Sigmoid_4.weights9_4": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 12408720, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_21.const", + "file_size": 256 + }, + "NhwcConv_6_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 12408976, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_22.const", + "file_size": 2785280 + }, + "GroupNorm_6_wts_7_1_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 15194256, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_23.const", + "file_size": 2048 + }, + "Sigmoid_5.weights9_5": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 15196304, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_24.const", + "file_size": 256 + }, + "NhwcConv_7_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 15196560, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_25.const", + "file_size": 2785280 + }, + "GroupNorm_7_wts_7_1_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 17981840, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_26.const", + "file_size": 2048 + }, + "Sigmoid_6.weights9_6": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 17983888, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_27.const", + "file_size": 256 + }, + "NhwcConv_8_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 17984144, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_28.const", + "file_size": 2785280 + }, + "GroupNorm_8_wts_7_1_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 20769424, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_29.const", + "file_size": 2048 + }, + "Sigmoid_7.weights9_7": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 20771472, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_30.const", + "file_size": 256 + }, + "NhwcConv_9_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 20771728, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_31.const", + "file_size": 2785280 + }, + "GroupNorm_9_wts_7_1_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 23557008, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_32.const", + "file_size": 2048 + }, + "Sigmoid_8.weights9_8": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 23559056, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_33.const", + "file_size": 256 + }, + "NhwcConv_10_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 23559312, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_34.const", + "file_size": 2785280 + }, + "GroupNorm_10_wts_7_1_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 26344592, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_35.const", + "file_size": 2048 + }, + "Sigmoid_9.weights9_9": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 26346640, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_36.const", + "file_size": 256 + }, + "NhwcConv_11_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 26346896, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_37.const", + "file_size": 2785280 + }, + "/decoder/up_blocks.0/upsamplers.0/Resize.weights10_0": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 29132176, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_38.const", + "file_size": 256 + }, + "NhwcConv_12_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 29132432, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_39.const", + "file_size": 2785280 + }, + "GroupNorm_11_wts_7_1_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 31917712, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_40.const", + "file_size": 2048 + }, + "Sigmoid_10.weights9_10": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 31919760, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_41.const", + "file_size": 256 + }, + "NhwcConv_13_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 31920016, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_42.const", + "file_size": 2785280 + }, + "GroupNorm_12_wts_7_1_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 34705296, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_43.const", + "file_size": 2048 + }, + "Sigmoid_11.weights9_11": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 34707344, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_44.const", + "file_size": 256 + }, + "NhwcConv_14_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 34707600, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_45.const", + "file_size": 2785280 + }, + "GroupNorm_13_wts_7_1_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 37492880, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_46.const", + "file_size": 2048 + }, + "Sigmoid_12.weights9_12": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 37494928, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_47.const", + "file_size": 256 + }, + "NhwcConv_15_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 37495184, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_48.const", + "file_size": 2785280 + }, + "GroupNorm_14_wts_7_1_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 40280464, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_49.const", + "file_size": 2048 + }, + "Sigmoid_13.weights9_13": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 40282512, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_50.const", + "file_size": 256 + }, + "NhwcConv_16_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 40282768, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_51.const", + "file_size": 2785280 + }, + "GroupNorm_15_wts_7_1_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 43068048, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_52.const", + "file_size": 2048 + }, + "Sigmoid_14.weights9_14": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 43070096, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_53.const", + "file_size": 256 + }, + "NhwcConv_17_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 43070352, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_54.const", + "file_size": 2785280 + }, + "GroupNorm_16_wts_7_1_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 45855632, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_55.const", + "file_size": 2048 + }, + "Sigmoid_15.weights9_15": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 45857680, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_56.const", + "file_size": 256 + }, + "NhwcConv_18_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 45857936, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_57.const", + "file_size": 2785280 + }, + "/decoder/up_blocks.1/upsamplers.0/Resize.weights10_1": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 48643216, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_58.const", + "file_size": 256 + }, + "NhwcConv_19_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 2785280 + ], + "size_in_bytes": 2785280, + "offset": 48643472, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_59.const", + "file_size": 2785280 + }, + "GroupNorm_17_wts_7_1_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 1024 + ], + "size_in_bytes": 2048, + "offset": 51428752, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_60.const", + "file_size": 2048 + }, + "NhwcConv_20_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 163840 + ], + "size_in_bytes": 163840, + "offset": 51430800, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_61.const", + "file_size": 163840 + }, + "Sigmoid_16.weights9_16": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 51594640, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_62.const", + "file_size": 256 + }, + "NhwcConv_21_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 1392640 + ], + "size_in_bytes": 1392640, + "offset": 51594896, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_63.const", + "file_size": 1392640 + }, + "GroupNorm_18_wts_7_1_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 512 + ], + "size_in_bytes": 1024, + "offset": 52987536, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_64.const", + "file_size": 1024 + }, + "Sigmoid_17.weights9_17": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 52988560, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_65.const", + "file_size": 256 + }, + "NhwcConv_22_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 696320 + ], + "size_in_bytes": 696320, + "offset": 52988816, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_66.const", + "file_size": 696320 + }, + "GroupNorm_19_wts_7_1_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 512 + ], + "size_in_bytes": 1024, + "offset": 53685136, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_67.const", + "file_size": 1024 + }, + "Sigmoid_18.weights9_18": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 53686160, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_68.const", + "file_size": 256 + }, + "NhwcConv_23_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 696320 + ], + "size_in_bytes": 696320, + "offset": 53686416, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_69.const", + "file_size": 696320 + }, + "GroupNorm_20_wts_7_1_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 512 + ], + "size_in_bytes": 1024, + "offset": 54382736, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_70.const", + "file_size": 1024 + }, + "Sigmoid_19.weights9_19": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 54383760, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_71.const", + "file_size": 256 + }, + "NhwcConv_24_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 696320 + ], + "size_in_bytes": 696320, + "offset": 54384016, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_72.const", + "file_size": 696320 + }, + "GroupNorm_21_wts_7_1_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 512 + ], + "size_in_bytes": 1024, + "offset": 55080336, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_73.const", + "file_size": 1024 + }, + "Sigmoid_20.weights9_20": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 55081360, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_74.const", + "file_size": 256 + }, + "NhwcConv_25_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 696320 + ], + "size_in_bytes": 696320, + "offset": 55081616, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_75.const", + "file_size": 696320 + }, + "GroupNorm_22_wts_7_1_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 512 + ], + "size_in_bytes": 1024, + "offset": 55777936, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_76.const", + "file_size": 1024 + }, + "Sigmoid_21.weights9_21": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 55778960, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_77.const", + "file_size": 256 + }, + "NhwcConv_26_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 696320 + ], + "size_in_bytes": 696320, + "offset": 55779216, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_78.const", + "file_size": 696320 + }, + "/decoder/up_blocks.2/upsamplers.0/Resize.weights10_2": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 56475536, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_79.const", + "file_size": 256 + }, + "NhwcConv_27_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 696320 + ], + "size_in_bytes": 696320, + "offset": 56475792, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_80.const", + "file_size": 696320 + }, + "GroupNorm_23_wts_7_1_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 512 + ], + "size_in_bytes": 1024, + "offset": 57172112, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_81.const", + "file_size": 1024 + }, + "NhwcConv_28_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 40960 + ], + "size_in_bytes": 40960, + "offset": 57173136, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_82.const", + "file_size": 40960 + }, + "Sigmoid_22.weights9_22": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 57214096, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_83.const", + "file_size": 256 + }, + "NhwcConv_29_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 348160 + ], + "size_in_bytes": 348160, + "offset": 57214352, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_84.const", + "file_size": 348160 + }, + "GroupNorm_24_wts_7_1_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 57562512, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_85.const", + "file_size": 512 + }, + "Sigmoid_23.weights9_23": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 57563024, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_86.const", + "file_size": 256 + }, + "NhwcConv_30_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 174080 + ], + "size_in_bytes": 174080, + "offset": 57563280, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_87.const", + "file_size": 174080 + }, + "GroupNorm_25_wts_7_1_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 57737360, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_88.const", + "file_size": 512 + }, + "Sigmoid_24.weights9_24": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 57737872, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_89.const", + "file_size": 256 + }, + "NhwcConv_31_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 174080 + ], + "size_in_bytes": 174080, + "offset": 57738128, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_90.const", + "file_size": 174080 + }, + "GroupNorm_26_wts_7_1_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 57912208, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_91.const", + "file_size": 512 + }, + "Sigmoid_25.weights9_25": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 57912720, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_92.const", + "file_size": 256 + }, + "NhwcConv_32_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 174080 + ], + "size_in_bytes": 174080, + "offset": 57912976, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_93.const", + "file_size": 174080 + }, + "GroupNorm_27_wts_7_1_26": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 58087056, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_94.const", + "file_size": 512 + }, + "Sigmoid_26.weights9_26": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 58087568, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_95.const", + "file_size": 256 + }, + "NhwcConv_33_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 174080 + ], + "size_in_bytes": 174080, + "offset": 58087824, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_96.const", + "file_size": 174080 + }, + "GroupNorm_28_wts_7_1_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 58261904, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_97.const", + "file_size": 512 + }, + "Sigmoid_27.weights9_27": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 58262416, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_98.const", + "file_size": 256 + }, + "NhwcConv_34_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 174080 + ], + "size_in_bytes": 174080, + "offset": 58262672, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_99.const", + "file_size": 174080 + }, + "GroupNorm_29_wts_7_1_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 256 + ], + "size_in_bytes": 512, + "offset": 58436752, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_100.const", + "file_size": 512 + }, + "Sigmoid_28.weights9_28": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfloat16", + "shape": [ + 128 + ], + "size_in_bytes": 256, + "offset": 58437264, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_101.const", + "file_size": 256 + }, + "NhwcConv_35_weight_NHWC": { + "packed_buffer_label": "const", + "xrt_arg_id": 3, + "dtype": "bfp16ebs8", + "shape": [ + 21760 + ], + "size_in_bytes": 21760, + "offset": 58437520, + "file_name": ".cache\\NhwcConv_0-post_quant_convConv_102.const", + "file_size": 21760 + } + }, + "aux_info": {} +} \ No newline at end of file