diff --git "a/llm.mnn.json" "b/llm.mnn.json" new file mode 100644--- /dev/null +++ "b/llm.mnn.json" @@ -0,0 +1,29906 @@ + +{ "bizCode": "MNNTest", "extraInfo": +{ "version": "3.2.5" } +, "oplists": +[ +{ "main_type": "Input", "main": +{ "dims": +[ 1, 1, 1152 ] +, "dtype": "DT_FLOAT", "dformat": "NCHW" } +, "name": "input_ids", "outputIndexes": +[ 4 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 2, 1, -1, -1, 3 ] +, "dtype": "DT_FLOAT", "dformat": "NCHW" } +, "name": "attention_mask", "outputIndexes": +[ 131 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 1, -1 ] +, "dtype": "DT_INT32", "dformat": "NCHW" } +, "name": "position_ids", "outputIndexes": +[ 2 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 26, 2, 1, -1, 1, 256 ] +, "dtype": "DT_FLOAT", "dformat": "NCHW" } +, "name": "past_key_values", "outputIndexes": +[ 0 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Input", "main": +{ "dims": +[ 1 ] +, "dtype": "DT_INT32", "dformat": "NCHW" } +, "name": "logits_index", "outputIndexes": +[ 3 ] +, "type": "Input", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 0 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1 ] +, "dimType": "NCHW" } +, "name": "presents", "outputIndexes": +[ 1 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 34.0 ] + } +, "name": "/Constant_output_0", "outputIndexes": +[ 5 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 4, 5 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/Mul_output_0", "outputIndexes": +[ 6 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 3 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1, -1, 1152 ] + } +, "name": "/blocks.0/Constant_output_0", "outputIndexes": +[ 7 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 6, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/Reshape_output_0", "outputIndexes": +[ 8 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 8 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 0, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.0/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 9 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 9 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 2968 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2968 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 2969 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2969 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 9216, 589846, 147456, 0, 0 ] + } +, "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": +[ 2970 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2970 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 2971 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2971 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 10 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 9 ] +, "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_output_0", "outputIndexes": +[ 11 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 11 ] +, "main_type": "NONE", "name": "Shape53", "outputIndexes": +[ 12 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 11 ] +, "main_type": "NONE", "name": "Rank55", "outputIndexes": +[ 13 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 13, 13 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp57", "outputIndexes": +[ 14 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 14 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze58", "outputIndexes": +[ 15 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1 ] + } +, "name": "Const9", "outputIndexes": +[ 16 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 14, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp60", "outputIndexes": +[ 17 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 17 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze61", "outputIndexes": +[ 18 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1 ] + } +, "name": "Unsqueeze63", "outputIndexes": +[ 19 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 15, 18, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice64", "outputIndexes": +[ 20 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 20 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze65", "outputIndexes": +[ 21 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 21, 21 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp67", "outputIndexes": +[ 22 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 11, 22, 14 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_output_0", "outputIndexes": +[ 23 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 0 ] + } +, "name": "/rotary/Constant_4_output_0", "outputIndexes": +[ 24 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 23, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 25 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 14 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze77", "outputIndexes": +[ 26 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 17 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze80", "outputIndexes": +[ 27 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 12, 26, 27, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice83", "outputIndexes": +[ 28 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 28 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze84", "outputIndexes": +[ 29 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 29 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp85", "outputIndexes": +[ 30 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 30, 29 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp86", "outputIndexes": +[ 31 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 11, 31, 14 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_1_output_0", "outputIndexes": +[ 32 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 32, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 33 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 4 ] + } +, "name": "/blocks.0/self_attn/Constant_3_output_0", "outputIndexes": +[ 34 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 256 ] + } +, "name": "/blocks.0/self_attn/Constant_4_output_0", "outputIndexes": +[ 35 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 25, 33, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.0/self_attn/Concat_output_0", "outputIndexes": +[ 36 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 10, 36 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/self_attn/Reshape_output_0", "outputIndexes": +[ 37 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 37 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 746518, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.0/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 39 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2 ] +, "main_type": "CastParam", "main": +{ "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } +, "name": "/rotary/Cast_output_0", "outputIndexes": +[ 40 ] +, "type": "Cast", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 2 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ -1, 1 ] + } +, "name": "/rotary/Constant_1_output_0", "outputIndexes": +[ 41 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 40, 41 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/rotary/Reshape_output_0", "outputIndexes": +[ 42 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 128 ] +, "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 1.0, 0.897687, 0.805842, 0.723394, 0.649382, 0.582942, 0.523299, 0.469759, 0.421697, 0.378552, 0.339821, 0.305053, 0.273842, 0.245824, 0.220673, 0.198096, 0.177828, 0.159634, 0.143301, 0.12864, 0.115478, 0.103663, 0.093057, 0.083536, 0.074989, 0.067317, 0.06043, 0.054247, 0.048697, 0.043714, 0.039242, 0.035227, 0.031623, 0.028387, 0.025483, 0.022876, 0.020535, 0.018434, 0.016548, 0.014855, 0.013335, 0.011971, 0.010746, 0.009647, 0.00866, 0.007774, 0.006978, 0.006264, 0.005623, 0.005048, 0.004532, 0.004068, 0.003652, 0.003278, 0.002943, 0.002642, 0.002371, 0.002129, 0.001911, 0.001715, 0.00154, 0.001382, 0.001241, 0.001114, 0.001, 0.000898, 0.000806, 0.000723, 0.000649, 0.000583, 0.000523, 0.00047, 0.000422, 0.000379, 0.00034, 0.000305, 0.000274, 0.000246, 0.000221, 0.000198, 0.000178, 0.00016, 0.000143, 0.000129, 0.000115, 0.000104, 0.000093, 0.000084, 0.000075, 0.000067, 0.00006, 0.000054, 0.000049, 0.000044, 0.000039, 0.000035, 0.000032, 0.000028, 0.000025, 0.000023, 0.000021, 0.000018, 0.000017, 0.000015, 0.000013, 0.000012, 0.000011, 0.00001, 0.000009, 0.000008, 0.000007, 0.000006, 0.000006, 0.000005, 0.000005, 0.000004, 0.000004, 0.000003, 0.000003, 0.000003, 0.000002, 0.000002, 0.000002, 0.000002, 0.000002, 0.000001, 0.000001, 0.000001 ] + } +, "name": "/rotary/Constant_2_output_0", "outputIndexes": +[ 43 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 42, 43 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/rotary/Mul_output_0", "outputIndexes": +[ 44 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 44 ] +, "main_type": "UnaryOp", "main": +{ "opType": "COS", "T": "DT_FLOAT" } +, "name": "/rotary/Cos_output_0", "outputIndexes": +[ 45 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 45, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_output_0", "outputIndexes": +[ 46 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 44 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SIN", "T": "DT_FLOAT" } +, "name": "/rotary/Sin_output_0", "outputIndexes": +[ 47 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 47, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": +[ 48 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 46, 48 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/rotary/Concat_output_0", "outputIndexes": +[ 49 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 49, 49 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/rotary/Concat_1_output_0", "outputIndexes": +[ 50 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 2 ] + } +, "name": "/rotary/Constant_7_output_0", "outputIndexes": +[ 51 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 50, 51 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": +[ 52 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 52, 19 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": +[ 53 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 53 ] +, "main_type": "NONE", "name": "Shape117", "outputIndexes": +[ 54 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 53 ] +, "main_type": "NONE", "name": "Rank119", "outputIndexes": +[ 55 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 55, 55 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp121", "outputIndexes": +[ 56 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 56 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze122", "outputIndexes": +[ 57 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 56, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp124", "outputIndexes": +[ 58 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 58 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze125", "outputIndexes": +[ 59 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 54, 57, 59, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice128", "outputIndexes": +[ 60 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 60 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze129", "outputIndexes": +[ 61 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 61, 61 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp131", "outputIndexes": +[ 62 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 53, 62, 56 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_2_output_0", "outputIndexes": +[ 63 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 39, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_output_0", "outputIndexes": +[ 64 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 39 ] +, "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_2_output_0", "outputIndexes": +[ 65 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 3 ] + } +, "name": "/blocks.0/self_attn/Constant_9_output_0", "outputIndexes": +[ 66 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 65 ] +, "main_type": "NONE", "name": "Shape257", "outputIndexes": +[ 67 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 65 ] +, "main_type": "NONE", "name": "Rank259", "outputIndexes": +[ 68 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 68, 68 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp261", "outputIndexes": +[ 69 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 69 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze262", "outputIndexes": +[ 70 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 69, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp264", "outputIndexes": +[ 71 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 71 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze265", "outputIndexes": +[ 72 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 67, 70, 72, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice268", "outputIndexes": +[ 73 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 73 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze269", "outputIndexes": +[ 74 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 74 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp270", "outputIndexes": +[ 75 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 75, 74 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp271", "outputIndexes": +[ 76 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 65, 76, 69 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_4_output_0", "outputIndexes": +[ 77 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 2 ] + } +, "name": "/rotary/Constant_6_output_0", "outputIndexes": +[ 78 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 77, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Div_output_0", "outputIndexes": +[ 79 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 79, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 80 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 1073741824 ] + } +, "name": "/blocks.0/self_attn/Constant_18_output_0", "outputIndexes": +[ 81 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dims": +[ 1 ] +, "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": +[ 3 ] + } +, "name": "/blocks.0/self_attn/Constant_12_output_0", "outputIndexes": +[ 82 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 39, 80, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_1_output_0", "outputIndexes": +[ 83 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 83 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.0/self_attn/Neg_output_0", "outputIndexes": +[ 84 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 79, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 85 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 39, 24, 85, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_output_0", "outputIndexes": +[ 86 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 84, 86 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.0/self_attn/Concat_3_output_0", "outputIndexes": +[ 87 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 56 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze168", "outputIndexes": +[ 88 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 58 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze171", "outputIndexes": +[ 89 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 54, 88, 89, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice174", "outputIndexes": +[ 90 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 90 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze175", "outputIndexes": +[ 91 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 91 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp176", "outputIndexes": +[ 92 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 92, 91 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp177", "outputIndexes": +[ 93 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 53, 93, 56 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_3_output_0", "outputIndexes": +[ 94 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 87, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_1_output_0", "outputIndexes": +[ 95 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 64, 95 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Add_output_0", "outputIndexes": +[ 96 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2969 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 748566, 147478, 36864, 0, 0 ] + } +, "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": +[ 2974 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2974 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 2975 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2975 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 97 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 23, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 98 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 32, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 99 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 98, 99, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.0/self_attn/Concat_1_output_0", "outputIndexes": +[ 100 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 97, 100 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/self_attn/Reshape_1_output_0", "outputIndexes": +[ 101 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 101 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 932908, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.0/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 103 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 103, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_2_output_0", "outputIndexes": +[ 104 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 103 ] +, "main_type": "NONE", "name": "/blocks.0/self_attn/Shape_3_output_0", "outputIndexes": +[ 105 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 105 ] +, "main_type": "NONE", "name": "Shape136", "outputIndexes": +[ 106 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 105 ] +, "main_type": "NONE", "name": "Rank138", "outputIndexes": +[ 107 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 107, 107 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp140", "outputIndexes": +[ 108 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 108 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze141", "outputIndexes": +[ 109 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 108, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp143", "outputIndexes": +[ 110 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 110 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze144", "outputIndexes": +[ 111 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 106, 109, 111, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice147", "outputIndexes": +[ 112 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 112 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze148", "outputIndexes": +[ 113 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 113 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp149", "outputIndexes": +[ 114 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 114, 113 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp150", "outputIndexes": +[ 115 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 105, 115, 108 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.0/self_attn/Gather_5_output_0", "outputIndexes": +[ 116 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 116, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Div_1_output_0", "outputIndexes": +[ 117 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 117, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 118 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 103, 118, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_3_output_0", "outputIndexes": +[ 119 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 119 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.0/self_attn/Neg_1_output_0", "outputIndexes": +[ 120 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 117, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 121 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 103, 24, 121, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.0/self_attn/Slice_2_output_0", "outputIndexes": +[ 122 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 120, 122 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.0/self_attn/Concat_4_output_0", "outputIndexes": +[ 123 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 123, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Mul_3_output_0", "outputIndexes": +[ 124 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 104, 124 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/self_attn/Add_1_output_0", "outputIndexes": +[ 125 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2969 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 934956, 147478, 36864, 0, 0 ] + } +, "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": +[ 2978 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2978 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 2979 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2979 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 126 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 23, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 127 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 32, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.0/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 128 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 127, 128, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.0/self_attn/Concat_2_output_0", "outputIndexes": +[ 129 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 126, 129 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.0/self_attn/Reshape_2_output_0", "outputIndexes": +[ 130 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131 ] +, "main_type": "NONE", "name": "Shape378", "outputIndexes": +[ 132 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 131 ] +, "main_type": "NONE", "name": "Rank380", "outputIndexes": +[ 133 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 133, 133 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp382", "outputIndexes": +[ 134 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze383", "outputIndexes": +[ 135 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp385", "outputIndexes": +[ 136 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze386", "outputIndexes": +[ 137 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 135, 137, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice389", "outputIndexes": +[ 138 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 138 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze390", "outputIndexes": +[ 139 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 139 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp391", "outputIndexes": +[ 140 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 140, 139 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp392", "outputIndexes": +[ 141 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 141, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_1_output_0", "outputIndexes": +[ 142 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 96, 125, 130, 142 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.0/self_attn/Reshape_7_output_0", "outputIndexes": +[ 143 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 143 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 2980 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2980 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 2981 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2981 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1119298, 589846, 147456, 0, 0 ] + } +, "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": +[ 2982 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2982 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 2983 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2983 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 144 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 144 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 1856600, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.0/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 146 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 8, 146 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/Add_output_0", "outputIndexes": +[ 147 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 0.5 ] + } +, "name": "/blocks.0/mlp/act_fn/Constant_3_output_0", "outputIndexes": +[ 148 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 147 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 1865816, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.0/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 149 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 149 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 2984 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2984 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 2985 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2985 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 1875032, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": +[ 2986 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2986 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 2987 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2987 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 150 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 1.0 ] + } +, "name": "/blocks.0/input_layernorm/Constant_2_output_0", "outputIndexes": +[ 151 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 0.797885 ] + } +, "name": "/blocks.0/mlp/act_fn/Constant_1_output_0", "outputIndexes": +[ 152 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "main_type": "Blob", "main": +{ "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": +[ 0.044715 ] + } +, "name": "/blocks.0/mlp/act_fn/Constant_output_0", "outputIndexes": +[ 153 ] +, "type": "Const", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 150 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.0/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 154 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 150, 154 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 155 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 155 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 156 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 150, 156 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Add_output_0", "outputIndexes": +[ 157 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 157 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 158 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 158 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.0/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 159 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 159 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 160 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 150, 160 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 161 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 161 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 162 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2985 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 6851694, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": +[ 2990 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2990 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 2991 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2991 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 163 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 162, 163 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/mlp/Mul_output_0", "outputIndexes": +[ 164 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 164 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 2992 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2992 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 2993 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2993 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 11828356, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": +[ 2994 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2994 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 2995 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2995 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 165 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 165 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 16805018, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.0/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 167 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 147, 167 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.0/Add_1_output_0", "outputIndexes": +[ 168 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 168, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/Reshape_output_0", "outputIndexes": +[ 169 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 169 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 16814234, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.1/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 170 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 170 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 2996 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2996 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 2997 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2997 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 16823450, 589846, 147456, 0, 0 ] + } +, "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": +[ 2998 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2998 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 2999 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2999 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 171 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 170 ] +, "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_output_0", "outputIndexes": +[ 172 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 172 ] +, "main_type": "NONE", "name": "Shape546", "outputIndexes": +[ 173 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 172 ] +, "main_type": "NONE", "name": "Rank548", "outputIndexes": +[ 174 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 174, 174 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp550", "outputIndexes": +[ 175 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 175 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze551", "outputIndexes": +[ 176 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 175, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp553", "outputIndexes": +[ 177 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 177 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze554", "outputIndexes": +[ 178 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 173, 176, 178, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice557", "outputIndexes": +[ 179 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 179 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze558", "outputIndexes": +[ 180 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 180, 180 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp560", "outputIndexes": +[ 181 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 172, 181, 175 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_output_0", "outputIndexes": +[ 182 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 182, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 183 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 175 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze568", "outputIndexes": +[ 184 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 177 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze571", "outputIndexes": +[ 185 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 173, 184, 185, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice574", "outputIndexes": +[ 186 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 186 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze575", "outputIndexes": +[ 187 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 187 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp576", "outputIndexes": +[ 188 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 188, 187 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp577", "outputIndexes": +[ 189 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 172, 189, 175 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_1_output_0", "outputIndexes": +[ 190 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 190, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 191 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 183, 191, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.1/self_attn/Concat_output_0", "outputIndexes": +[ 192 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 171, 192 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/self_attn/Reshape_output_0", "outputIndexes": +[ 193 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 193 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 17560752, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.1/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 195 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 195, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_output_0", "outputIndexes": +[ 196 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 195 ] +, "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_2_output_0", "outputIndexes": +[ 197 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 197 ] +, "main_type": "NONE", "name": "Shape694", "outputIndexes": +[ 198 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 197 ] +, "main_type": "NONE", "name": "Rank696", "outputIndexes": +[ 199 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 199, 199 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp698", "outputIndexes": +[ 200 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 200 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze699", "outputIndexes": +[ 201 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 200, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp701", "outputIndexes": +[ 202 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 202 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze702", "outputIndexes": +[ 203 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 198, 201, 203, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice705", "outputIndexes": +[ 204 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 204 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze706", "outputIndexes": +[ 205 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 205 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp707", "outputIndexes": +[ 206 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 206, 205 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp708", "outputIndexes": +[ 207 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 197, 207, 200 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_2_output_0", "outputIndexes": +[ 208 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 208, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Div_output_0", "outputIndexes": +[ 209 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 209, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 210 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 195, 210, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_1_output_0", "outputIndexes": +[ 211 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 211 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.1/self_attn/Neg_output_0", "outputIndexes": +[ 212 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 209, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 213 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 195, 24, 213, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_output_0", "outputIndexes": +[ 214 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 212, 214 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.1/self_attn/Concat_3_output_0", "outputIndexes": +[ 215 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 215, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_1_output_0", "outputIndexes": +[ 216 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 196, 216 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Add_output_0", "outputIndexes": +[ 217 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2997 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 17562800, 147478, 36864, 0, 0 ] + } +, "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": +[ 3002 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3002 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3003 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3003 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 218 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 182, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 219 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 190, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 220 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 219, 220, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.1/self_attn/Concat_1_output_0", "outputIndexes": +[ 221 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 218, 221 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/self_attn/Reshape_1_output_0", "outputIndexes": +[ 222 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 222 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 17747142, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.1/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 224 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 224, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_2_output_0", "outputIndexes": +[ 225 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 224 ] +, "main_type": "NONE", "name": "/blocks.1/self_attn/Shape_3_output_0", "outputIndexes": +[ 226 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 226 ] +, "main_type": "NONE", "name": "Shape593", "outputIndexes": +[ 227 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 226 ] +, "main_type": "NONE", "name": "Rank595", "outputIndexes": +[ 228 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 228, 228 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp597", "outputIndexes": +[ 229 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 229 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze598", "outputIndexes": +[ 230 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 229, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp600", "outputIndexes": +[ 231 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 231 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze601", "outputIndexes": +[ 232 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 227, 230, 232, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice604", "outputIndexes": +[ 233 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 233 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze605", "outputIndexes": +[ 234 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 234 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp606", "outputIndexes": +[ 235 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 235, 234 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp607", "outputIndexes": +[ 236 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 226, 236, 229 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.1/self_attn/Gather_3_output_0", "outputIndexes": +[ 237 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 237, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Div_1_output_0", "outputIndexes": +[ 238 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 238, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 239 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 224, 239, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_3_output_0", "outputIndexes": +[ 240 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 240 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.1/self_attn/Neg_1_output_0", "outputIndexes": +[ 241 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 238, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 242 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 224, 24, 242, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.1/self_attn/Slice_2_output_0", "outputIndexes": +[ 243 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 241, 243 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.1/self_attn/Concat_4_output_0", "outputIndexes": +[ 244 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 244, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Mul_3_output_0", "outputIndexes": +[ 245 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 225, 245 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/self_attn/Add_1_output_0", "outputIndexes": +[ 246 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2997 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 17749190, 147478, 36864, 0, 0 ] + } +, "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": +[ 3006 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3006 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3007 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3007 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 247 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 182, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 248 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 190, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.1/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 249 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 248, 249, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.1/self_attn/Concat_2_output_0", "outputIndexes": +[ 250 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 247, 250 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.1/self_attn/Reshape_2_output_0", "outputIndexes": +[ 251 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze815", "outputIndexes": +[ 252 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze818", "outputIndexes": +[ 253 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 252, 253, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice821", "outputIndexes": +[ 254 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 254 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze822", "outputIndexes": +[ 255 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 255 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp823", "outputIndexes": +[ 256 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 256, 255 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp824", "outputIndexes": +[ 257 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 257, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_3_output_0", "outputIndexes": +[ 258 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 217, 246, 251, 258 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.1/self_attn/Reshape_7_output_0", "outputIndexes": +[ 259 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 259 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3008 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3008 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3009 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3009 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 17933532, 589846, 147456, 0, 0 ] + } +, "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": +[ 3010 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3010 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3011 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3011 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 260 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 260 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 18670834, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.1/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 262 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 169, 262 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/Add_output_0", "outputIndexes": +[ 263 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 263 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 18680050, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.1/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 264 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 264 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3012 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3012 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3013 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3013 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 18689266, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": +[ 3014 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3014 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3015 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3015 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 265 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 265 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.1/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 266 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 265, 266 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 267 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 267 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 268 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 265, 268 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Add_output_0", "outputIndexes": +[ 269 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 269 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 270 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 270 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.1/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 271 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 271 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 272 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 265, 272 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 273 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 273 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 274 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3013 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 23665928, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": +[ 3018 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3018 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3019 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3019 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 275 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 274, 275 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/mlp/Mul_output_0", "outputIndexes": +[ 276 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 276 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3020 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3020 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3021 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3021 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 28642590, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": +[ 3022 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3022 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3023 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3023 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 277 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 277 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 33619252, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.1/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 279 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 263, 279 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.1/Add_1_output_0", "outputIndexes": +[ 280 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 280, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/Reshape_output_0", "outputIndexes": +[ 281 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 281 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 33628468, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.2/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 282 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 282 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3024 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3024 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3025 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3025 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 33637684, 589846, 147456, 0, 0 ] + } +, "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": +[ 3026 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3026 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3027 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3027 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 283 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 282 ] +, "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_output_0", "outputIndexes": +[ 284 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 284 ] +, "main_type": "NONE", "name": "Shape975", "outputIndexes": +[ 285 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 284 ] +, "main_type": "NONE", "name": "Rank977", "outputIndexes": +[ 286 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 286, 286 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp979", "outputIndexes": +[ 287 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 287 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze980", "outputIndexes": +[ 288 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 287, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp982", "outputIndexes": +[ 289 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 289 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze983", "outputIndexes": +[ 290 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 285, 288, 290, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice986", "outputIndexes": +[ 291 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 291 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze987", "outputIndexes": +[ 292 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 292, 292 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp989", "outputIndexes": +[ 293 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 284, 293, 287 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_output_0", "outputIndexes": +[ 294 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 294, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 295 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 287 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze997", "outputIndexes": +[ 296 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 289 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1000", "outputIndexes": +[ 297 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 285, 296, 297, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1003", "outputIndexes": +[ 298 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 298 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1004", "outputIndexes": +[ 299 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 299 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1005", "outputIndexes": +[ 300 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 300, 299 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1006", "outputIndexes": +[ 301 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 284, 301, 287 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_1_output_0", "outputIndexes": +[ 302 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 302, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 303 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 295, 303, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.2/self_attn/Concat_output_0", "outputIndexes": +[ 304 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 283, 304 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/self_attn/Reshape_output_0", "outputIndexes": +[ 305 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 305 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 34374986, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.2/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 307 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 307, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_output_0", "outputIndexes": +[ 308 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 307 ] +, "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_2_output_0", "outputIndexes": +[ 309 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 309 ] +, "main_type": "NONE", "name": "Shape1123", "outputIndexes": +[ 310 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 309 ] +, "main_type": "NONE", "name": "Rank1125", "outputIndexes": +[ 311 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 311, 311 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1127", "outputIndexes": +[ 312 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 312 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1128", "outputIndexes": +[ 313 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 312, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1130", "outputIndexes": +[ 314 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 314 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1131", "outputIndexes": +[ 315 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 310, 313, 315, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1134", "outputIndexes": +[ 316 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 316 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1135", "outputIndexes": +[ 317 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 317 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1136", "outputIndexes": +[ 318 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 318, 317 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1137", "outputIndexes": +[ 319 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 309, 319, 312 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_2_output_0", "outputIndexes": +[ 320 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 320, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Div_output_0", "outputIndexes": +[ 321 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 321, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 322 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 307, 322, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_1_output_0", "outputIndexes": +[ 323 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 323 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.2/self_attn/Neg_output_0", "outputIndexes": +[ 324 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 321, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 325 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 307, 24, 325, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_output_0", "outputIndexes": +[ 326 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 324, 326 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.2/self_attn/Concat_3_output_0", "outputIndexes": +[ 327 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 327, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_1_output_0", "outputIndexes": +[ 328 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 308, 328 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Add_output_0", "outputIndexes": +[ 329 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3025 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 34377034, 147478, 36864, 0, 0 ] + } +, "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": +[ 3030 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3030 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3031 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3031 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 330 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 294, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 331 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 302, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 332 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 331, 332, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.2/self_attn/Concat_1_output_0", "outputIndexes": +[ 333 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 330, 333 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/self_attn/Reshape_1_output_0", "outputIndexes": +[ 334 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 334 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 34561376, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.2/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 336 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 336, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_2_output_0", "outputIndexes": +[ 337 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 336 ] +, "main_type": "NONE", "name": "/blocks.2/self_attn/Shape_3_output_0", "outputIndexes": +[ 338 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 338 ] +, "main_type": "NONE", "name": "Shape1022", "outputIndexes": +[ 339 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 338 ] +, "main_type": "NONE", "name": "Rank1024", "outputIndexes": +[ 340 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 340, 340 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1026", "outputIndexes": +[ 341 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 341 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1027", "outputIndexes": +[ 342 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 341, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1029", "outputIndexes": +[ 343 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 343 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1030", "outputIndexes": +[ 344 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 339, 342, 344, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1033", "outputIndexes": +[ 345 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 345 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1034", "outputIndexes": +[ 346 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 346 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1035", "outputIndexes": +[ 347 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 347, 346 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1036", "outputIndexes": +[ 348 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 338, 348, 341 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.2/self_attn/Gather_3_output_0", "outputIndexes": +[ 349 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 349, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Div_1_output_0", "outputIndexes": +[ 350 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 350, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 351 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 336, 351, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_3_output_0", "outputIndexes": +[ 352 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 352 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.2/self_attn/Neg_1_output_0", "outputIndexes": +[ 353 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 350, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 354 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 336, 24, 354, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.2/self_attn/Slice_2_output_0", "outputIndexes": +[ 355 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 353, 355 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.2/self_attn/Concat_4_output_0", "outputIndexes": +[ 356 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 356, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Mul_3_output_0", "outputIndexes": +[ 357 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 337, 357 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/self_attn/Add_1_output_0", "outputIndexes": +[ 358 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3025 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 34563424, 147478, 36864, 0, 0 ] + } +, "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": +[ 3034 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3034 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3035 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3035 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 359 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 294, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 360 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 302, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.2/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 361 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 360, 361, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.2/self_attn/Concat_2_output_0", "outputIndexes": +[ 362 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 359, 362 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.2/self_attn/Reshape_2_output_0", "outputIndexes": +[ 363 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1244", "outputIndexes": +[ 364 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1247", "outputIndexes": +[ 365 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 364, 365, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1250", "outputIndexes": +[ 366 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 366 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1251", "outputIndexes": +[ 367 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 367 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1252", "outputIndexes": +[ 368 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 368, 367 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1253", "outputIndexes": +[ 369 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 369, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_5_output_0", "outputIndexes": +[ 370 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 329, 358, 363, 370 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.2/self_attn/Reshape_7_output_0", "outputIndexes": +[ 371 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 371 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3036 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3036 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3037 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3037 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 34747766, 589846, 147456, 0, 0 ] + } +, "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": +[ 3038 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3038 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3039 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3039 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 372 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 372 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 35485068, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.2/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 374 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 281, 374 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/Add_output_0", "outputIndexes": +[ 375 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 375 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 35494284, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.2/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 376 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 376 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3040 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3040 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3041 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3041 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 35503500, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": +[ 3042 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3042 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3043 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3043 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 377 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 377 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.2/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 378 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 377, 378 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 379 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 379 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 380 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 377, 380 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Add_output_0", "outputIndexes": +[ 381 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 381 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 382 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 382 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.2/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 383 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 383 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 384 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 377, 384 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 385 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 385 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 386 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3041 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 40480162, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": +[ 3046 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3046 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3047 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3047 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 387 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 386, 387 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/mlp/Mul_output_0", "outputIndexes": +[ 388 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 388 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3048 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3048 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3049 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3049 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 45456824, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": +[ 3050 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3050 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3051 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3051 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 389 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 389 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 50433486, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.2/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 391 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 375, 391 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.2/Add_1_output_0", "outputIndexes": +[ 392 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 392, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/Reshape_output_0", "outputIndexes": +[ 393 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 393 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 50442702, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.3/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 394 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 394 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3052 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3052 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3053 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3053 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 50451918, 589846, 147456, 0, 0 ] + } +, "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": +[ 3054 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3054 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3055 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3055 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 395 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 394 ] +, "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_output_0", "outputIndexes": +[ 396 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 396 ] +, "main_type": "NONE", "name": "Shape1404", "outputIndexes": +[ 397 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 396 ] +, "main_type": "NONE", "name": "Rank1406", "outputIndexes": +[ 398 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 398, 398 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1408", "outputIndexes": +[ 399 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 399 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1409", "outputIndexes": +[ 400 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 399, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1411", "outputIndexes": +[ 401 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 401 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1412", "outputIndexes": +[ 402 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 397, 400, 402, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1415", "outputIndexes": +[ 403 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 403 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1416", "outputIndexes": +[ 404 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 404, 404 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1418", "outputIndexes": +[ 405 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 396, 405, 399 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_output_0", "outputIndexes": +[ 406 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 406, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 407 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 399 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1426", "outputIndexes": +[ 408 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 401 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1429", "outputIndexes": +[ 409 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 397, 408, 409, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1432", "outputIndexes": +[ 410 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 410 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1433", "outputIndexes": +[ 411 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 411 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1434", "outputIndexes": +[ 412 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 412, 411 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1435", "outputIndexes": +[ 413 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 396, 413, 399 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_1_output_0", "outputIndexes": +[ 414 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 414, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 415 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 407, 415, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.3/self_attn/Concat_output_0", "outputIndexes": +[ 416 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 395, 416 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/self_attn/Reshape_output_0", "outputIndexes": +[ 417 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 417 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 51189220, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.3/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 419 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 419, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_output_0", "outputIndexes": +[ 420 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 419 ] +, "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_2_output_0", "outputIndexes": +[ 421 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 421 ] +, "main_type": "NONE", "name": "Shape1552", "outputIndexes": +[ 422 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 421 ] +, "main_type": "NONE", "name": "Rank1554", "outputIndexes": +[ 423 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 423, 423 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1556", "outputIndexes": +[ 424 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 424 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1557", "outputIndexes": +[ 425 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 424, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1559", "outputIndexes": +[ 426 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 426 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1560", "outputIndexes": +[ 427 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 422, 425, 427, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1563", "outputIndexes": +[ 428 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 428 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1564", "outputIndexes": +[ 429 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 429 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1565", "outputIndexes": +[ 430 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 430, 429 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1566", "outputIndexes": +[ 431 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 421, 431, 424 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_2_output_0", "outputIndexes": +[ 432 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 432, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Div_output_0", "outputIndexes": +[ 433 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 433, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 434 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 419, 434, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_1_output_0", "outputIndexes": +[ 435 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 435 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.3/self_attn/Neg_output_0", "outputIndexes": +[ 436 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 433, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 437 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 419, 24, 437, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_output_0", "outputIndexes": +[ 438 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 436, 438 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.3/self_attn/Concat_3_output_0", "outputIndexes": +[ 439 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 439, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_1_output_0", "outputIndexes": +[ 440 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 420, 440 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Add_output_0", "outputIndexes": +[ 441 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3053 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 51191268, 147478, 36864, 0, 0 ] + } +, "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": +[ 3058 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3058 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3059 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3059 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 442 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 406, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 443 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 414, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 444 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 443, 444, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.3/self_attn/Concat_1_output_0", "outputIndexes": +[ 445 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 442, 445 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/self_attn/Reshape_1_output_0", "outputIndexes": +[ 446 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 446 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 51375610, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.3/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 448 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 448, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_2_output_0", "outputIndexes": +[ 449 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 448 ] +, "main_type": "NONE", "name": "/blocks.3/self_attn/Shape_3_output_0", "outputIndexes": +[ 450 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 450 ] +, "main_type": "NONE", "name": "Shape1451", "outputIndexes": +[ 451 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 450 ] +, "main_type": "NONE", "name": "Rank1453", "outputIndexes": +[ 452 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 452, 452 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1455", "outputIndexes": +[ 453 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 453 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1456", "outputIndexes": +[ 454 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 453, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1458", "outputIndexes": +[ 455 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 455 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1459", "outputIndexes": +[ 456 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 451, 454, 456, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1462", "outputIndexes": +[ 457 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 457 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1463", "outputIndexes": +[ 458 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 458 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1464", "outputIndexes": +[ 459 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 459, 458 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1465", "outputIndexes": +[ 460 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 450, 460, 453 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.3/self_attn/Gather_3_output_0", "outputIndexes": +[ 461 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 461, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Div_1_output_0", "outputIndexes": +[ 462 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 462, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 463 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 448, 463, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_3_output_0", "outputIndexes": +[ 464 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 464 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.3/self_attn/Neg_1_output_0", "outputIndexes": +[ 465 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 462, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 466 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 448, 24, 466, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.3/self_attn/Slice_2_output_0", "outputIndexes": +[ 467 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 465, 467 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.3/self_attn/Concat_4_output_0", "outputIndexes": +[ 468 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 468, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Mul_3_output_0", "outputIndexes": +[ 469 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 449, 469 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/self_attn/Add_1_output_0", "outputIndexes": +[ 470 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3053 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 51377658, 147478, 36864, 0, 0 ] + } +, "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": +[ 3062 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3062 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3063 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3063 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 471 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 406, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 472 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 414, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.3/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 473 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 472, 473, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.3/self_attn/Concat_2_output_0", "outputIndexes": +[ 474 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 471, 474 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.3/self_attn/Reshape_2_output_0", "outputIndexes": +[ 475 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1673", "outputIndexes": +[ 476 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1676", "outputIndexes": +[ 477 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 476, 477, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1679", "outputIndexes": +[ 478 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 478 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1680", "outputIndexes": +[ 479 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 479 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1681", "outputIndexes": +[ 480 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 480, 479 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1682", "outputIndexes": +[ 481 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 481, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_7_output_0", "outputIndexes": +[ 482 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 441, 470, 475, 482 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.3/self_attn/Reshape_7_output_0", "outputIndexes": +[ 483 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 483 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3064 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3064 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3065 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3065 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 51562000, 589846, 147456, 0, 0 ] + } +, "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": +[ 3066 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3066 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3067 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3067 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 484 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 484 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 52299302, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.3/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 486 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 393, 486 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/Add_output_0", "outputIndexes": +[ 487 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 487 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 52308518, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.3/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 488 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 488 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3068 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3068 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3069 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3069 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 52317734, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": +[ 3070 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3070 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3071 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3071 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 489 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 489 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.3/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 490 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 489, 490 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 491 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 491 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 492 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 489, 492 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Add_output_0", "outputIndexes": +[ 493 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 493 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 494 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 494 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.3/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 495 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 495 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 496 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 489, 496 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 497 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 497 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 498 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3069 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 57294396, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": +[ 3074 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3074 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3075 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3075 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 499 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 498, 499 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/mlp/Mul_output_0", "outputIndexes": +[ 500 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 500 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3076 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3076 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3077 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3077 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 62271058, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": +[ 3078 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3078 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3079 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3079 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 501 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 501 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 67247720, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.3/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 503 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 487, 503 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.3/Add_1_output_0", "outputIndexes": +[ 504 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 504, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/Reshape_output_0", "outputIndexes": +[ 505 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 505 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 67256936, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.4/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 506 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 506 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3080 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3080 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3081 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3081 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 67266152, 589846, 147456, 0, 0 ] + } +, "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": +[ 3082 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3082 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3083 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3083 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 507 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 506 ] +, "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_output_0", "outputIndexes": +[ 508 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 508 ] +, "main_type": "NONE", "name": "Shape1833", "outputIndexes": +[ 509 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 508 ] +, "main_type": "NONE", "name": "Rank1835", "outputIndexes": +[ 510 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 510, 510 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1837", "outputIndexes": +[ 511 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 511 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1838", "outputIndexes": +[ 512 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 511, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1840", "outputIndexes": +[ 513 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 513 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1841", "outputIndexes": +[ 514 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 509, 512, 514, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1844", "outputIndexes": +[ 515 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 515 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1845", "outputIndexes": +[ 516 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 516, 516 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1847", "outputIndexes": +[ 517 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 508, 517, 511 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_output_0", "outputIndexes": +[ 518 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 518, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 519 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 511 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1855", "outputIndexes": +[ 520 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 513 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1858", "outputIndexes": +[ 521 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 509, 520, 521, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1861", "outputIndexes": +[ 522 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 522 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1862", "outputIndexes": +[ 523 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 523 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1863", "outputIndexes": +[ 524 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 524, 523 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1864", "outputIndexes": +[ 525 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 508, 525, 511 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_1_output_0", "outputIndexes": +[ 526 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 526, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 527 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 519, 527, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.4/self_attn/Concat_output_0", "outputIndexes": +[ 528 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 507, 528 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/self_attn/Reshape_output_0", "outputIndexes": +[ 529 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 529 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 68003454, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.4/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 531 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 531, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_output_0", "outputIndexes": +[ 532 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 531 ] +, "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_2_output_0", "outputIndexes": +[ 533 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 533 ] +, "main_type": "NONE", "name": "Shape1982", "outputIndexes": +[ 534 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 533 ] +, "main_type": "NONE", "name": "Rank1984", "outputIndexes": +[ 535 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 535, 535 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1986", "outputIndexes": +[ 536 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 536 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1987", "outputIndexes": +[ 537 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 536, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1989", "outputIndexes": +[ 538 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 538 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1990", "outputIndexes": +[ 539 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 534, 537, 539, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1993", "outputIndexes": +[ 540 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 540 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1994", "outputIndexes": +[ 541 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 541 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1995", "outputIndexes": +[ 542 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 542, 541 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1996", "outputIndexes": +[ 543 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 533, 543, 536 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_2_output_0", "outputIndexes": +[ 544 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 544, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Div_output_0", "outputIndexes": +[ 545 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 545, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 546 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 531, 546, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_1_output_0", "outputIndexes": +[ 547 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 547 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.4/self_attn/Neg_output_0", "outputIndexes": +[ 548 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 545, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 549 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 531, 24, 549, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_output_0", "outputIndexes": +[ 550 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 548, 550 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.4/self_attn/Concat_3_output_0", "outputIndexes": +[ 551 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 551, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_1_output_0", "outputIndexes": +[ 552 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 532, 552 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Add_output_0", "outputIndexes": +[ 553 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3081 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 68005502, 147478, 36864, 0, 0 ] + } +, "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": +[ 3086 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3086 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3087 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3087 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 554 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 518, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 555 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 526, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 556 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 555, 556, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.4/self_attn/Concat_1_output_0", "outputIndexes": +[ 557 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 554, 557 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/self_attn/Reshape_1_output_0", "outputIndexes": +[ 558 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 558 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 68189844, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.4/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 560 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 560, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_2_output_0", "outputIndexes": +[ 561 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 560 ] +, "main_type": "NONE", "name": "/blocks.4/self_attn/Shape_3_output_0", "outputIndexes": +[ 562 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 562 ] +, "main_type": "NONE", "name": "Shape1880", "outputIndexes": +[ 563 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 562 ] +, "main_type": "NONE", "name": "Rank1882", "outputIndexes": +[ 564 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 564, 564 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1884", "outputIndexes": +[ 565 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 565 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1885", "outputIndexes": +[ 566 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 565, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1887", "outputIndexes": +[ 567 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 567 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze1888", "outputIndexes": +[ 568 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 563, 566, 568, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice1891", "outputIndexes": +[ 569 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 569 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze1892", "outputIndexes": +[ 570 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 570 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1893", "outputIndexes": +[ 571 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 571, 570 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp1894", "outputIndexes": +[ 572 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 562, 572, 565 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.4/self_attn/Gather_3_output_0", "outputIndexes": +[ 573 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 573, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Div_1_output_0", "outputIndexes": +[ 574 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 574, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 575 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 560, 575, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_3_output_0", "outputIndexes": +[ 576 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 576 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.4/self_attn/Neg_1_output_0", "outputIndexes": +[ 577 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 574, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 578 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 560, 24, 578, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.4/self_attn/Slice_2_output_0", "outputIndexes": +[ 579 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 577, 579 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.4/self_attn/Concat_4_output_0", "outputIndexes": +[ 580 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 580, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Mul_3_output_0", "outputIndexes": +[ 581 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 561, 581 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/self_attn/Add_1_output_0", "outputIndexes": +[ 582 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3081 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 68191892, 147478, 36864, 0, 0 ] + } +, "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": +[ 3090 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3090 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3091 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3091 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 583 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 518, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 584 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 526, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.4/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 585 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 584, 585, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.4/self_attn/Concat_2_output_0", "outputIndexes": +[ 586 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 583, 586 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.4/self_attn/Reshape_2_output_0", "outputIndexes": +[ 587 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2103", "outputIndexes": +[ 588 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2106", "outputIndexes": +[ 589 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 588, 589, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2109", "outputIndexes": +[ 590 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 590 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2110", "outputIndexes": +[ 591 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 591 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2111", "outputIndexes": +[ 592 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 592, 591 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2112", "outputIndexes": +[ 593 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 593, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_9_output_0", "outputIndexes": +[ 594 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 553, 582, 587, 594 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.4/self_attn/Reshape_7_output_0", "outputIndexes": +[ 595 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 595 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3092 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3092 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3093 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3093 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 68376234, 589846, 147456, 0, 0 ] + } +, "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": +[ 3094 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3094 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3095 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3095 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 596 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 596 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 69113536, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.4/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 598 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 505, 598 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/Add_output_0", "outputIndexes": +[ 599 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 599 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 69122752, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.4/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 600 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 600 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3096 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3096 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3097 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3097 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 69131968, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": +[ 3098 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3098 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3099 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3099 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 601 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.4/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 602 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601, 602 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 603 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 603 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 604 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601, 604 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Add_output_0", "outputIndexes": +[ 605 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 605 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 606 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 606 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.4/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 607 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 607 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 608 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 601, 608 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 609 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 609 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 610 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3097 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 74108630, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": +[ 3102 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3102 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3103 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3103 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 611 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 610, 611 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/mlp/Mul_output_0", "outputIndexes": +[ 612 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 612 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3104 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3104 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3105 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3105 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 79085292, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": +[ 3106 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3106 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3107 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3107 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 613 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 613 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 84061954, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.4/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 615 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 599, 615 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.4/Add_1_output_0", "outputIndexes": +[ 616 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 616, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/Reshape_output_0", "outputIndexes": +[ 617 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 617 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 84071170, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.5/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 618 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 618 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3108 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3108 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3109 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3109 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 84080386, 589846, 147456, 0, 0 ] + } +, "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": +[ 3110 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3110 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3111 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3111 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 619 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 618 ] +, "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_output_0", "outputIndexes": +[ 620 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 620 ] +, "main_type": "NONE", "name": "Shape2263", "outputIndexes": +[ 621 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 620 ] +, "main_type": "NONE", "name": "Rank2265", "outputIndexes": +[ 622 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 622, 622 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2267", "outputIndexes": +[ 623 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 623 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2268", "outputIndexes": +[ 624 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 623, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2270", "outputIndexes": +[ 625 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 625 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2271", "outputIndexes": +[ 626 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 621, 624, 626, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2274", "outputIndexes": +[ 627 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 627 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2275", "outputIndexes": +[ 628 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 628, 628 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2277", "outputIndexes": +[ 629 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 620, 629, 623 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_output_0", "outputIndexes": +[ 630 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 630, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 631 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 623 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2285", "outputIndexes": +[ 632 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 625 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2288", "outputIndexes": +[ 633 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 621, 632, 633, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2291", "outputIndexes": +[ 634 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 634 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2292", "outputIndexes": +[ 635 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 635 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2293", "outputIndexes": +[ 636 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 636, 635 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2294", "outputIndexes": +[ 637 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 620, 637, 623 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_1_output_0", "outputIndexes": +[ 638 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 638, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 639 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 631, 639, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.5/self_attn/Concat_output_0", "outputIndexes": +[ 640 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 619, 640 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/self_attn/Reshape_output_0", "outputIndexes": +[ 641 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 641 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 84817688, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.5/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 643 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 643, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_output_0", "outputIndexes": +[ 644 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 643 ] +, "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_2_output_0", "outputIndexes": +[ 645 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 645 ] +, "main_type": "NONE", "name": "Shape2412", "outputIndexes": +[ 646 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 645 ] +, "main_type": "NONE", "name": "Rank2414", "outputIndexes": +[ 647 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 647, 647 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2416", "outputIndexes": +[ 648 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 648 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2417", "outputIndexes": +[ 649 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 648, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2419", "outputIndexes": +[ 650 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 650 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2420", "outputIndexes": +[ 651 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 646, 649, 651, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2423", "outputIndexes": +[ 652 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 652 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2424", "outputIndexes": +[ 653 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 653 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2425", "outputIndexes": +[ 654 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 654, 653 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2426", "outputIndexes": +[ 655 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 645, 655, 648 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_2_output_0", "outputIndexes": +[ 656 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 656, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Div_output_0", "outputIndexes": +[ 657 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 657, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 658 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 643, 658, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_1_output_0", "outputIndexes": +[ 659 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 659 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.5/self_attn/Neg_output_0", "outputIndexes": +[ 660 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 657, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 661 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 643, 24, 661, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_output_0", "outputIndexes": +[ 662 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 660, 662 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.5/self_attn/Concat_3_output_0", "outputIndexes": +[ 663 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 663, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_1_output_0", "outputIndexes": +[ 664 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 644, 664 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Add_output_0", "outputIndexes": +[ 665 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3109 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 84819736, 147478, 36864, 0, 0 ] + } +, "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": +[ 3114 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3114 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3115 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3115 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 666 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 630, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 667 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 638, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 668 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 667, 668, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.5/self_attn/Concat_1_output_0", "outputIndexes": +[ 669 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 666, 669 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/self_attn/Reshape_1_output_0", "outputIndexes": +[ 670 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 670 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 85004078, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.5/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 672 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 672, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_2_output_0", "outputIndexes": +[ 673 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 672 ] +, "main_type": "NONE", "name": "/blocks.5/self_attn/Shape_3_output_0", "outputIndexes": +[ 674 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 674 ] +, "main_type": "NONE", "name": "Shape2310", "outputIndexes": +[ 675 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 674 ] +, "main_type": "NONE", "name": "Rank2312", "outputIndexes": +[ 676 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 676, 676 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2314", "outputIndexes": +[ 677 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 677 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2315", "outputIndexes": +[ 678 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 677, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2317", "outputIndexes": +[ 679 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 679 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2318", "outputIndexes": +[ 680 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 675, 678, 680, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2321", "outputIndexes": +[ 681 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 681 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2322", "outputIndexes": +[ 682 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 682 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2323", "outputIndexes": +[ 683 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 683, 682 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2324", "outputIndexes": +[ 684 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 674, 684, 677 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.5/self_attn/Gather_3_output_0", "outputIndexes": +[ 685 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 685, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Div_1_output_0", "outputIndexes": +[ 686 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 686, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 687 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 672, 687, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_3_output_0", "outputIndexes": +[ 688 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 688 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.5/self_attn/Neg_1_output_0", "outputIndexes": +[ 689 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 686, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 690 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 672, 24, 690, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.5/self_attn/Slice_2_output_0", "outputIndexes": +[ 691 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 689, 691 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.5/self_attn/Concat_4_output_0", "outputIndexes": +[ 692 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 692, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Mul_3_output_0", "outputIndexes": +[ 693 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 673, 693 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/self_attn/Add_1_output_0", "outputIndexes": +[ 694 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3109 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 85006126, 147478, 36864, 0, 0 ] + } +, "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": +[ 3118 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3118 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3119 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3119 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 695 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 630, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 696 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 638, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.5/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 697 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 696, 697, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.5/self_attn/Concat_2_output_0", "outputIndexes": +[ 698 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 695, 698 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.5/self_attn/Reshape_2_output_0", "outputIndexes": +[ 699 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2533", "outputIndexes": +[ 700 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2536", "outputIndexes": +[ 701 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 700, 701, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2539", "outputIndexes": +[ 702 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 702 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2540", "outputIndexes": +[ 703 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 703, 703 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2542", "outputIndexes": +[ 704 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 704, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_11_output_0", "outputIndexes": +[ 705 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 665, 694, 699, 705 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.5/self_attn/Reshape_7_output_0", "outputIndexes": +[ 706 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 706 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3120 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3120 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3121 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3121 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 85190468, 589846, 147456, 0, 0 ] + } +, "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": +[ 3122 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3122 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3123 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3123 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 707 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 707 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 85927770, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.5/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 709 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 617, 709 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/Add_output_0", "outputIndexes": +[ 710 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 710 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 85936986, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.5/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 711 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 711 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3124 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3124 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3125 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3125 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 85946202, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": +[ 3126 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3126 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3127 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3127 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 712 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 712 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.5/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 713 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 712, 713 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 714 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 714 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 715 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 712, 715 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Add_output_0", "outputIndexes": +[ 716 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 716 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 717 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 717 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.5/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 718 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 718 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 719 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 712, 719 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 720 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 720 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 721 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3125 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 90922864, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": +[ 3130 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3130 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3131 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3131 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 722 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 721, 722 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/mlp/Mul_output_0", "outputIndexes": +[ 723 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 723 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3132 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3132 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3133 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3133 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 95899526, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": +[ 3134 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3134 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3135 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3135 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 724 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 724 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 100876188, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.5/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 726 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 710, 726 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.5/Add_1_output_0", "outputIndexes": +[ 727 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 727, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/Reshape_output_0", "outputIndexes": +[ 728 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 728 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 100885404, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.6/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 729 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 729 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3136 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3136 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3137 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3137 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 100894620, 589846, 147456, 0, 0 ] + } +, "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": +[ 3138 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3138 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3139 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3139 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 730 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 729 ] +, "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_output_0", "outputIndexes": +[ 731 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 731 ] +, "main_type": "NONE", "name": "Shape2693", "outputIndexes": +[ 732 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 731 ] +, "main_type": "NONE", "name": "Rank2695", "outputIndexes": +[ 733 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 733, 733 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2697", "outputIndexes": +[ 734 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 734 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2698", "outputIndexes": +[ 735 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 734, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2700", "outputIndexes": +[ 736 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 736 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2701", "outputIndexes": +[ 737 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 732, 735, 737, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2704", "outputIndexes": +[ 738 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 738 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2705", "outputIndexes": +[ 739 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 739, 739 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2707", "outputIndexes": +[ 740 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 731, 740, 734 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_output_0", "outputIndexes": +[ 741 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 741, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 742 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 734 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2715", "outputIndexes": +[ 743 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 736 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2718", "outputIndexes": +[ 744 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 732, 743, 744, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2721", "outputIndexes": +[ 745 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 745 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2722", "outputIndexes": +[ 746 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 746 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2723", "outputIndexes": +[ 747 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 747, 746 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2724", "outputIndexes": +[ 748 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 731, 748, 734 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_1_output_0", "outputIndexes": +[ 749 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 749, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 750 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 742, 750, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.6/self_attn/Concat_output_0", "outputIndexes": +[ 751 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 730, 751 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/self_attn/Reshape_output_0", "outputIndexes": +[ 752 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 752 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 101631922, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.6/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 754 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 754, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_output_0", "outputIndexes": +[ 755 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 754 ] +, "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_2_output_0", "outputIndexes": +[ 756 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 756 ] +, "main_type": "NONE", "name": "Shape2842", "outputIndexes": +[ 757 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 756 ] +, "main_type": "NONE", "name": "Rank2844", "outputIndexes": +[ 758 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 758, 758 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2846", "outputIndexes": +[ 759 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 759 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2847", "outputIndexes": +[ 760 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 759, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2849", "outputIndexes": +[ 761 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 761 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2850", "outputIndexes": +[ 762 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 757, 760, 762, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2853", "outputIndexes": +[ 763 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 763 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2854", "outputIndexes": +[ 764 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 764 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2855", "outputIndexes": +[ 765 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 765, 764 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2856", "outputIndexes": +[ 766 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 756, 766, 759 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_2_output_0", "outputIndexes": +[ 767 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 767, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Div_output_0", "outputIndexes": +[ 768 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 768, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 769 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 754, 769, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_1_output_0", "outputIndexes": +[ 770 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 770 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.6/self_attn/Neg_output_0", "outputIndexes": +[ 771 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 768, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 772 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 754, 24, 772, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_output_0", "outputIndexes": +[ 773 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 771, 773 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.6/self_attn/Concat_3_output_0", "outputIndexes": +[ 774 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 774, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_1_output_0", "outputIndexes": +[ 775 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 755, 775 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Add_output_0", "outputIndexes": +[ 776 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3137 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 101633970, 147478, 36864, 0, 0 ] + } +, "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": +[ 3142 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3142 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3143 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3143 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 777 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 741, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 778 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 749, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 779 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 778, 779, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.6/self_attn/Concat_1_output_0", "outputIndexes": +[ 780 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 777, 780 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/self_attn/Reshape_1_output_0", "outputIndexes": +[ 781 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 781 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 101818312, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.6/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 783 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 783, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_2_output_0", "outputIndexes": +[ 784 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 783 ] +, "main_type": "NONE", "name": "/blocks.6/self_attn/Shape_3_output_0", "outputIndexes": +[ 785 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 785 ] +, "main_type": "NONE", "name": "Shape2740", "outputIndexes": +[ 786 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 785 ] +, "main_type": "NONE", "name": "Rank2742", "outputIndexes": +[ 787 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 787, 787 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2744", "outputIndexes": +[ 788 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 788 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2745", "outputIndexes": +[ 789 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 788, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2747", "outputIndexes": +[ 790 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 790 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2748", "outputIndexes": +[ 791 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 786, 789, 791, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2751", "outputIndexes": +[ 792 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 792 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2752", "outputIndexes": +[ 793 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 793 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2753", "outputIndexes": +[ 794 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 794, 793 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2754", "outputIndexes": +[ 795 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 785, 795, 788 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.6/self_attn/Gather_3_output_0", "outputIndexes": +[ 796 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 796, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Div_1_output_0", "outputIndexes": +[ 797 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 797, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 798 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 783, 798, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_3_output_0", "outputIndexes": +[ 799 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 799 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.6/self_attn/Neg_1_output_0", "outputIndexes": +[ 800 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 797, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 801 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 783, 24, 801, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.6/self_attn/Slice_2_output_0", "outputIndexes": +[ 802 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 800, 802 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.6/self_attn/Concat_4_output_0", "outputIndexes": +[ 803 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 803, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Mul_3_output_0", "outputIndexes": +[ 804 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 784, 804 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/self_attn/Add_1_output_0", "outputIndexes": +[ 805 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3137 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 101820360, 147478, 36864, 0, 0 ] + } +, "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": +[ 3146 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3146 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3147 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3147 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 806 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 741, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 807 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 749, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.6/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 808 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 807, 808, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.6/self_attn/Concat_2_output_0", "outputIndexes": +[ 809 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 806, 809 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.6/self_attn/Reshape_2_output_0", "outputIndexes": +[ 810 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2963", "outputIndexes": +[ 811 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze2966", "outputIndexes": +[ 812 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 811, 812, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice2969", "outputIndexes": +[ 813 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 813 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze2970", "outputIndexes": +[ 814 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 814 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2971", "outputIndexes": +[ 815 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 815, 814 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp2972", "outputIndexes": +[ 816 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 816, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_13_output_0", "outputIndexes": +[ 817 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 776, 805, 810, 817 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.6/self_attn/Reshape_7_output_0", "outputIndexes": +[ 818 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 818 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3148 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3148 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3149 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3149 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 102004702, 589846, 147456, 0, 0 ] + } +, "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": +[ 3150 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3150 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3151 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3151 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 819 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 819 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 102742004, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.6/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 821 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 728, 821 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/Add_output_0", "outputIndexes": +[ 822 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 822 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 102751220, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.6/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 823 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 823 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3152 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3152 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3153 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3153 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 102760436, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": +[ 3154 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3154 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3155 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3155 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 824 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 824 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.6/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 825 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 824, 825 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 826 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 826 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 827 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 824, 827 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Add_output_0", "outputIndexes": +[ 828 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 828 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 829 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 829 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.6/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 830 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 830 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 831 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 824, 831 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 832 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 832 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 833 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3153 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 107737098, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": +[ 3158 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3158 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3159 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3159 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 834 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 833, 834 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/mlp/Mul_output_0", "outputIndexes": +[ 835 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 835 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3160 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3160 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3161 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3161 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 112713760, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": +[ 3162 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3162 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3163 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3163 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 836 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 836 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 117690422, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.6/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 838 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 822, 838 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.6/Add_1_output_0", "outputIndexes": +[ 839 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 839, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/Reshape_output_0", "outputIndexes": +[ 840 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 840 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 117699638, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.7/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 841 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 841 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3164 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3164 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3165 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3165 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 117708854, 589846, 147456, 0, 0 ] + } +, "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": +[ 3166 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3166 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3167 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3167 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 842 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 841 ] +, "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_output_0", "outputIndexes": +[ 843 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 843 ] +, "main_type": "NONE", "name": "Shape3123", "outputIndexes": +[ 844 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 843 ] +, "main_type": "NONE", "name": "Rank3125", "outputIndexes": +[ 845 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 845, 845 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3127", "outputIndexes": +[ 846 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 846 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3128", "outputIndexes": +[ 847 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 846, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3130", "outputIndexes": +[ 848 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 848 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3131", "outputIndexes": +[ 849 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 844, 847, 849, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3134", "outputIndexes": +[ 850 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 850 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3135", "outputIndexes": +[ 851 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 851, 851 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3137", "outputIndexes": +[ 852 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 843, 852, 846 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_output_0", "outputIndexes": +[ 853 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 853, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 854 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 846 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3145", "outputIndexes": +[ 855 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 848 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3148", "outputIndexes": +[ 856 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 844, 855, 856, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3151", "outputIndexes": +[ 857 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 857 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3152", "outputIndexes": +[ 858 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 858 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3153", "outputIndexes": +[ 859 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 859, 858 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3154", "outputIndexes": +[ 860 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 843, 860, 846 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_1_output_0", "outputIndexes": +[ 861 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 861, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 862 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 854, 862, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.7/self_attn/Concat_output_0", "outputIndexes": +[ 863 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 842, 863 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/self_attn/Reshape_output_0", "outputIndexes": +[ 864 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 864 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 118446156, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.7/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 866 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 866, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_output_0", "outputIndexes": +[ 867 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 866 ] +, "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_2_output_0", "outputIndexes": +[ 868 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 868 ] +, "main_type": "NONE", "name": "Shape3272", "outputIndexes": +[ 869 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 868 ] +, "main_type": "NONE", "name": "Rank3274", "outputIndexes": +[ 870 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 870, 870 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3276", "outputIndexes": +[ 871 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 871 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3277", "outputIndexes": +[ 872 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 871, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3279", "outputIndexes": +[ 873 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 873 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3280", "outputIndexes": +[ 874 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 869, 872, 874, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3283", "outputIndexes": +[ 875 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 875 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3284", "outputIndexes": +[ 876 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 876 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3285", "outputIndexes": +[ 877 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 877, 876 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3286", "outputIndexes": +[ 878 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 868, 878, 871 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_2_output_0", "outputIndexes": +[ 879 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 879, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Div_output_0", "outputIndexes": +[ 880 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 880, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 881 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 866, 881, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_1_output_0", "outputIndexes": +[ 882 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 882 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.7/self_attn/Neg_output_0", "outputIndexes": +[ 883 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 880, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 884 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 866, 24, 884, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_output_0", "outputIndexes": +[ 885 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 883, 885 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.7/self_attn/Concat_3_output_0", "outputIndexes": +[ 886 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 886, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_1_output_0", "outputIndexes": +[ 887 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 867, 887 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Add_output_0", "outputIndexes": +[ 888 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3165 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 118448204, 147478, 36864, 0, 0 ] + } +, "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": +[ 3170 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3170 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3171 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3171 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 889 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 853, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 890 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 861, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 891 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 890, 891, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.7/self_attn/Concat_1_output_0", "outputIndexes": +[ 892 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 889, 892 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/self_attn/Reshape_1_output_0", "outputIndexes": +[ 893 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 893 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 118632546, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.7/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 895 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 895, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_2_output_0", "outputIndexes": +[ 896 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 895 ] +, "main_type": "NONE", "name": "/blocks.7/self_attn/Shape_3_output_0", "outputIndexes": +[ 897 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 897 ] +, "main_type": "NONE", "name": "Shape3170", "outputIndexes": +[ 898 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 897 ] +, "main_type": "NONE", "name": "Rank3172", "outputIndexes": +[ 899 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 899, 899 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3174", "outputIndexes": +[ 900 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 900 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3175", "outputIndexes": +[ 901 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 900, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3177", "outputIndexes": +[ 902 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 902 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3178", "outputIndexes": +[ 903 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 898, 901, 903, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3181", "outputIndexes": +[ 904 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 904 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3182", "outputIndexes": +[ 905 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 905 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3183", "outputIndexes": +[ 906 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 906, 905 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3184", "outputIndexes": +[ 907 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 897, 907, 900 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.7/self_attn/Gather_3_output_0", "outputIndexes": +[ 908 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 908, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Div_1_output_0", "outputIndexes": +[ 909 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 909, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 910 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 895, 910, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_3_output_0", "outputIndexes": +[ 911 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 911 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.7/self_attn/Neg_1_output_0", "outputIndexes": +[ 912 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 909, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 913 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 895, 24, 913, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.7/self_attn/Slice_2_output_0", "outputIndexes": +[ 914 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 912, 914 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.7/self_attn/Concat_4_output_0", "outputIndexes": +[ 915 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 915, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Mul_3_output_0", "outputIndexes": +[ 916 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 896, 916 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/self_attn/Add_1_output_0", "outputIndexes": +[ 917 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3165 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 118634594, 147478, 36864, 0, 0 ] + } +, "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": +[ 3174 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3174 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3175 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3175 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 918 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 853, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 919 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 861, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.7/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 920 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 919, 920, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.7/self_attn/Concat_2_output_0", "outputIndexes": +[ 921 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 918, 921 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.7/self_attn/Reshape_2_output_0", "outputIndexes": +[ 922 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3393", "outputIndexes": +[ 923 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3396", "outputIndexes": +[ 924 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 923, 924, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3399", "outputIndexes": +[ 925 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 925 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3400", "outputIndexes": +[ 926 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 926 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3401", "outputIndexes": +[ 927 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 927, 926 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3402", "outputIndexes": +[ 928 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 928, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_15_output_0", "outputIndexes": +[ 929 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 888, 917, 922, 929 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.7/self_attn/Reshape_7_output_0", "outputIndexes": +[ 930 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 930 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3176 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3176 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3177 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3177 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 118818936, 589846, 147456, 0, 0 ] + } +, "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": +[ 3178 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3178 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3179 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3179 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 931 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 931 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 119556238, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.7/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 933 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 840, 933 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/Add_output_0", "outputIndexes": +[ 934 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 934 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 119565454, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.7/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 935 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 935 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3180 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3180 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3181 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3181 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 119574670, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": +[ 3182 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3182 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3183 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3183 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 936 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 936 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.7/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 937 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 936, 937 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 938 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 938 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 939 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 936, 939 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Add_output_0", "outputIndexes": +[ 940 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 940 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 941 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 941 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.7/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 942 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 942 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 943 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 936, 943 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 944 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 944 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 945 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3181 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 124551332, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": +[ 3186 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3186 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3187 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3187 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 946 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 945, 946 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/mlp/Mul_output_0", "outputIndexes": +[ 947 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 947 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3188 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3188 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3189 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3189 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 129527994, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": +[ 3190 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3190 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3191 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3191 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 948 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 948 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 134504656, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.7/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 950 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 934, 950 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.7/Add_1_output_0", "outputIndexes": +[ 951 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 951, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/Reshape_output_0", "outputIndexes": +[ 952 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 952 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 134513872, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.8/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 953 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 953 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3192 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3192 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3193 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3193 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 134523088, 589846, 147456, 0, 0 ] + } +, "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": +[ 3194 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3194 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3195 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3195 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 954 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 953 ] +, "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_output_0", "outputIndexes": +[ 955 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 955 ] +, "main_type": "NONE", "name": "Shape3553", "outputIndexes": +[ 956 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 955 ] +, "main_type": "NONE", "name": "Rank3555", "outputIndexes": +[ 957 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 957, 957 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3557", "outputIndexes": +[ 958 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 958 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3558", "outputIndexes": +[ 959 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 958, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3560", "outputIndexes": +[ 960 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 960 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3561", "outputIndexes": +[ 961 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 956, 959, 961, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3564", "outputIndexes": +[ 962 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 962 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3565", "outputIndexes": +[ 963 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 963, 963 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3567", "outputIndexes": +[ 964 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 955, 964, 958 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_output_0", "outputIndexes": +[ 965 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 965, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 966 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 958 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3575", "outputIndexes": +[ 967 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 960 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3578", "outputIndexes": +[ 968 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 956, 967, 968, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3581", "outputIndexes": +[ 969 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 969 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3582", "outputIndexes": +[ 970 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 970 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3583", "outputIndexes": +[ 971 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 971, 970 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3584", "outputIndexes": +[ 972 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 955, 972, 958 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_1_output_0", "outputIndexes": +[ 973 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 973, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 974 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 966, 974, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.8/self_attn/Concat_output_0", "outputIndexes": +[ 975 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 954, 975 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/self_attn/Reshape_output_0", "outputIndexes": +[ 976 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 976 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 135260390, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.8/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 978 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 978, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_output_0", "outputIndexes": +[ 979 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 978 ] +, "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_2_output_0", "outputIndexes": +[ 980 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 980 ] +, "main_type": "NONE", "name": "Shape3702", "outputIndexes": +[ 981 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 980 ] +, "main_type": "NONE", "name": "Rank3704", "outputIndexes": +[ 982 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 982, 982 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3706", "outputIndexes": +[ 983 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 983 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3707", "outputIndexes": +[ 984 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 983, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3709", "outputIndexes": +[ 985 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 985 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3710", "outputIndexes": +[ 986 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 981, 984, 986, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3713", "outputIndexes": +[ 987 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 987 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3714", "outputIndexes": +[ 988 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 988 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3715", "outputIndexes": +[ 989 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 989, 988 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3716", "outputIndexes": +[ 990 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 980, 990, 983 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_2_output_0", "outputIndexes": +[ 991 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 991, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Div_output_0", "outputIndexes": +[ 992 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 992, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 993 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 978, 993, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_1_output_0", "outputIndexes": +[ 994 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 994 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.8/self_attn/Neg_output_0", "outputIndexes": +[ 995 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 992, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 996 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 978, 24, 996, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_output_0", "outputIndexes": +[ 997 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 995, 997 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.8/self_attn/Concat_3_output_0", "outputIndexes": +[ 998 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 998, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_1_output_0", "outputIndexes": +[ 999 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 979, 999 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Add_output_0", "outputIndexes": +[ 1000 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3193 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 135262438, 147478, 36864, 0, 0 ] + } +, "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": +[ 3198 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3198 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3199 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3199 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1001 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 965, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1002 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 973, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1003 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1002, 1003, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.8/self_attn/Concat_1_output_0", "outputIndexes": +[ 1004 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1001, 1004 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1005 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1005 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 135446780, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.8/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1007 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1007, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_2_output_0", "outputIndexes": +[ 1008 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1007 ] +, "main_type": "NONE", "name": "/blocks.8/self_attn/Shape_3_output_0", "outputIndexes": +[ 1009 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1009 ] +, "main_type": "NONE", "name": "Shape3600", "outputIndexes": +[ 1010 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1009 ] +, "main_type": "NONE", "name": "Rank3602", "outputIndexes": +[ 1011 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1011, 1011 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3604", "outputIndexes": +[ 1012 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1012 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3605", "outputIndexes": +[ 1013 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1012, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3607", "outputIndexes": +[ 1014 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1014 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3608", "outputIndexes": +[ 1015 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1010, 1013, 1015, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3611", "outputIndexes": +[ 1016 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1016 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3612", "outputIndexes": +[ 1017 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1017 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3613", "outputIndexes": +[ 1018 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1018, 1017 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3614", "outputIndexes": +[ 1019 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1009, 1019, 1012 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.8/self_attn/Gather_3_output_0", "outputIndexes": +[ 1020 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1020, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Div_1_output_0", "outputIndexes": +[ 1021 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1021, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1022 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1007, 1022, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_3_output_0", "outputIndexes": +[ 1023 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1023 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.8/self_attn/Neg_1_output_0", "outputIndexes": +[ 1024 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1021, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1025 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1007, 24, 1025, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.8/self_attn/Slice_2_output_0", "outputIndexes": +[ 1026 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1024, 1026 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.8/self_attn/Concat_4_output_0", "outputIndexes": +[ 1027 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1027, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Mul_3_output_0", "outputIndexes": +[ 1028 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1008, 1028 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/self_attn/Add_1_output_0", "outputIndexes": +[ 1029 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3193 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 135448828, 147478, 36864, 0, 0 ] + } +, "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": +[ 3202 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3202 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3203 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3203 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1030 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 965, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1031 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 973, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.8/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1032 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1031, 1032, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.8/self_attn/Concat_2_output_0", "outputIndexes": +[ 1033 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1030, 1033 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.8/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1034 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3823", "outputIndexes": +[ 1035 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3826", "outputIndexes": +[ 1036 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1035, 1036, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3829", "outputIndexes": +[ 1037 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1037 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3830", "outputIndexes": +[ 1038 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1038 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3831", "outputIndexes": +[ 1039 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1039, 1038 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3832", "outputIndexes": +[ 1040 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1040, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_17_output_0", "outputIndexes": +[ 1041 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1000, 1029, 1034, 1041 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.8/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1042 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1042 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3204 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3204 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3205 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3205 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 135633170, 589846, 147456, 0, 0 ] + } +, "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": +[ 3206 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3206 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3207 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3207 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1043 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1043 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 136370472, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.8/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1045 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 952, 1045 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/Add_output_0", "outputIndexes": +[ 1046 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1046 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 136379688, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.8/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1047 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1047 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3208 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3208 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3209 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3209 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 136388904, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": +[ 3210 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3210 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3211 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3211 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1048 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1048 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.8/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1049 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1048, 1049 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1050 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1050 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1051 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1048, 1051 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1052 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1052 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1053 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1053 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.8/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1054 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1054 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1055 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1048, 1055 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1056 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1056 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1057 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3209 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 141365566, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": +[ 3214 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3214 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3215 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3215 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1058 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1057, 1058 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/mlp/Mul_output_0", "outputIndexes": +[ 1059 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1059 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3216 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3216 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3217 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3217 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 146342228, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": +[ 3218 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3218 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3219 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3219 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1060 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1060 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 151318890, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.8/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1062 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1046, 1062 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.8/Add_1_output_0", "outputIndexes": +[ 1063 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1063, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/Reshape_output_0", "outputIndexes": +[ 1064 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1064 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 151328106, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.9/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1065 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1065 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3220 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3220 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3221 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3221 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 151337322, 589846, 147456, 0, 0 ] + } +, "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": +[ 3222 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3222 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3223 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3223 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1066 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1065 ] +, "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_output_0", "outputIndexes": +[ 1067 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1067 ] +, "main_type": "NONE", "name": "Shape3983", "outputIndexes": +[ 1068 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1067 ] +, "main_type": "NONE", "name": "Rank3985", "outputIndexes": +[ 1069 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1069, 1069 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3987", "outputIndexes": +[ 1070 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1070 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3988", "outputIndexes": +[ 1071 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1070, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3990", "outputIndexes": +[ 1072 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1072 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze3991", "outputIndexes": +[ 1073 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1068, 1071, 1073, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice3994", "outputIndexes": +[ 1074 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1074 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze3995", "outputIndexes": +[ 1075 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1075, 1075 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp3997", "outputIndexes": +[ 1076 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1067, 1076, 1070 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_output_0", "outputIndexes": +[ 1077 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1077, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1078 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1070 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4005", "outputIndexes": +[ 1079 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1072 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4008", "outputIndexes": +[ 1080 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1068, 1079, 1080, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4011", "outputIndexes": +[ 1081 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1081 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4012", "outputIndexes": +[ 1082 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1082 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4013", "outputIndexes": +[ 1083 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1083, 1082 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4014", "outputIndexes": +[ 1084 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1067, 1084, 1070 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_1_output_0", "outputIndexes": +[ 1085 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1085, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1086 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1078, 1086, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.9/self_attn/Concat_output_0", "outputIndexes": +[ 1087 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1066, 1087 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/self_attn/Reshape_output_0", "outputIndexes": +[ 1088 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1088 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 152074624, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.9/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1090 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1090, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_output_0", "outputIndexes": +[ 1091 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1090 ] +, "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_2_output_0", "outputIndexes": +[ 1092 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1092 ] +, "main_type": "NONE", "name": "Shape4132", "outputIndexes": +[ 1093 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1092 ] +, "main_type": "NONE", "name": "Rank4134", "outputIndexes": +[ 1094 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1094, 1094 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4136", "outputIndexes": +[ 1095 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1095 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4137", "outputIndexes": +[ 1096 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1095, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4139", "outputIndexes": +[ 1097 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1097 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4140", "outputIndexes": +[ 1098 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1093, 1096, 1098, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4143", "outputIndexes": +[ 1099 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1099 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4144", "outputIndexes": +[ 1100 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1100 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4145", "outputIndexes": +[ 1101 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1101, 1100 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4146", "outputIndexes": +[ 1102 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1092, 1102, 1095 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_2_output_0", "outputIndexes": +[ 1103 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1103, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Div_output_0", "outputIndexes": +[ 1104 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1104, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1105 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1090, 1105, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_1_output_0", "outputIndexes": +[ 1106 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1106 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.9/self_attn/Neg_output_0", "outputIndexes": +[ 1107 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1104, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1108 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1090, 24, 1108, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_output_0", "outputIndexes": +[ 1109 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1107, 1109 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.9/self_attn/Concat_3_output_0", "outputIndexes": +[ 1110 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1110, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_1_output_0", "outputIndexes": +[ 1111 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1091, 1111 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Add_output_0", "outputIndexes": +[ 1112 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3221 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 152076672, 147478, 36864, 0, 0 ] + } +, "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": +[ 3226 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3226 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3227 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3227 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1113 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1077, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1114 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1085, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1115 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1114, 1115, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.9/self_attn/Concat_1_output_0", "outputIndexes": +[ 1116 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1113, 1116 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1117 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1117 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 152261014, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.9/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1119 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1119, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_2_output_0", "outputIndexes": +[ 1120 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1119 ] +, "main_type": "NONE", "name": "/blocks.9/self_attn/Shape_3_output_0", "outputIndexes": +[ 1121 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1121 ] +, "main_type": "NONE", "name": "Shape4030", "outputIndexes": +[ 1122 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1121 ] +, "main_type": "NONE", "name": "Rank4032", "outputIndexes": +[ 1123 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1123, 1123 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4034", "outputIndexes": +[ 1124 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1124 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4035", "outputIndexes": +[ 1125 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1124, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4037", "outputIndexes": +[ 1126 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1126 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4038", "outputIndexes": +[ 1127 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1122, 1125, 1127, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4041", "outputIndexes": +[ 1128 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1128 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4042", "outputIndexes": +[ 1129 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1129 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4043", "outputIndexes": +[ 1130 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1130, 1129 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4044", "outputIndexes": +[ 1131 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1121, 1131, 1124 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.9/self_attn/Gather_3_output_0", "outputIndexes": +[ 1132 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1132, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Div_1_output_0", "outputIndexes": +[ 1133 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1133, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1134 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1119, 1134, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_3_output_0", "outputIndexes": +[ 1135 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1135 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.9/self_attn/Neg_1_output_0", "outputIndexes": +[ 1136 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1133, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1137 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1119, 24, 1137, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.9/self_attn/Slice_2_output_0", "outputIndexes": +[ 1138 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1136, 1138 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.9/self_attn/Concat_4_output_0", "outputIndexes": +[ 1139 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1139, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Mul_3_output_0", "outputIndexes": +[ 1140 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1120, 1140 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/self_attn/Add_1_output_0", "outputIndexes": +[ 1141 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3221 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 152263062, 147478, 36864, 0, 0 ] + } +, "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": +[ 3230 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3230 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3231 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3231 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1142 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1077, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1143 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1085, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.9/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1144 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1143, 1144, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.9/self_attn/Concat_2_output_0", "outputIndexes": +[ 1145 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1142, 1145 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.9/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1146 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4253", "outputIndexes": +[ 1147 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4256", "outputIndexes": +[ 1148 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1147, 1148, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4259", "outputIndexes": +[ 1149 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1149 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4260", "outputIndexes": +[ 1150 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1150 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4261", "outputIndexes": +[ 1151 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1151, 1150 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4262", "outputIndexes": +[ 1152 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1152, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_19_output_0", "outputIndexes": +[ 1153 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1112, 1141, 1146, 1153 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.9/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1154 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1154 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3232 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3232 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3233 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3233 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 152447404, 589846, 147456, 0, 0 ] + } +, "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": +[ 3234 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3234 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3235 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3235 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1155 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1155 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 153184706, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.9/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1157 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1064, 1157 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/Add_output_0", "outputIndexes": +[ 1158 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1158 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 153193922, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.9/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1159 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1159 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3236 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3236 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3237 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3237 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 153203138, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": +[ 3238 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3238 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3239 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3239 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1160 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1160 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.9/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1161 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1160, 1161 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1162 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1162 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1163 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1160, 1163 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1164 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1164 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1165 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1165 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.9/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1166 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1166 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1167 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1160, 1167 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1168 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1168 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1169 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3237 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 158179800, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": +[ 3242 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3242 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3243 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3243 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1170 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1169, 1170 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/mlp/Mul_output_0", "outputIndexes": +[ 1171 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1171 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3244 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3244 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3245 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3245 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 163156462, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": +[ 3246 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3246 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3247 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3247 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1172 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1172 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 168133124, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.9/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1174 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1158, 1174 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.9/Add_1_output_0", "outputIndexes": +[ 1175 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1175, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/Reshape_output_0", "outputIndexes": +[ 1176 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1176 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 168142340, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.10/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1177 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1177 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3248 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3248 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3249 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3249 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 168151556, 589846, 147456, 0, 0 ] + } +, "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": +[ 3250 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3250 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3251 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3251 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1178 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1177 ] +, "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_output_0", "outputIndexes": +[ 1179 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1179 ] +, "main_type": "NONE", "name": "Shape4413", "outputIndexes": +[ 1180 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1179 ] +, "main_type": "NONE", "name": "Rank4415", "outputIndexes": +[ 1181 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1181, 1181 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4417", "outputIndexes": +[ 1182 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1182 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4418", "outputIndexes": +[ 1183 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1182, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4420", "outputIndexes": +[ 1184 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1184 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4421", "outputIndexes": +[ 1185 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1180, 1183, 1185, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4424", "outputIndexes": +[ 1186 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1186 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4425", "outputIndexes": +[ 1187 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1187, 1187 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4427", "outputIndexes": +[ 1188 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1179, 1188, 1182 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_output_0", "outputIndexes": +[ 1189 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1189, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1190 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1182 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4435", "outputIndexes": +[ 1191 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1184 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4438", "outputIndexes": +[ 1192 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1180, 1191, 1192, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4441", "outputIndexes": +[ 1193 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1193 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4442", "outputIndexes": +[ 1194 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1194 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4443", "outputIndexes": +[ 1195 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1195, 1194 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4444", "outputIndexes": +[ 1196 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1179, 1196, 1182 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_1_output_0", "outputIndexes": +[ 1197 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1197, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1198 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1190, 1198, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.10/self_attn/Concat_output_0", "outputIndexes": +[ 1199 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1178, 1199 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/self_attn/Reshape_output_0", "outputIndexes": +[ 1200 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1200 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 168888858, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.10/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1202 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1202, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_output_0", "outputIndexes": +[ 1203 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1202 ] +, "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_2_output_0", "outputIndexes": +[ 1204 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1204 ] +, "main_type": "NONE", "name": "Shape4562", "outputIndexes": +[ 1205 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1204 ] +, "main_type": "NONE", "name": "Rank4564", "outputIndexes": +[ 1206 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1206, 1206 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4566", "outputIndexes": +[ 1207 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1207 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4567", "outputIndexes": +[ 1208 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1207, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4569", "outputIndexes": +[ 1209 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1209 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4570", "outputIndexes": +[ 1210 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1205, 1208, 1210, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4573", "outputIndexes": +[ 1211 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1211 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4574", "outputIndexes": +[ 1212 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1212 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4575", "outputIndexes": +[ 1213 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1213, 1212 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4576", "outputIndexes": +[ 1214 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1204, 1214, 1207 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_2_output_0", "outputIndexes": +[ 1215 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1215, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Div_output_0", "outputIndexes": +[ 1216 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1216, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1217 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1202, 1217, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_1_output_0", "outputIndexes": +[ 1218 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1218 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.10/self_attn/Neg_output_0", "outputIndexes": +[ 1219 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1216, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1220 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1202, 24, 1220, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_output_0", "outputIndexes": +[ 1221 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1219, 1221 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.10/self_attn/Concat_3_output_0", "outputIndexes": +[ 1222 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1222, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_1_output_0", "outputIndexes": +[ 1223 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1203, 1223 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Add_output_0", "outputIndexes": +[ 1224 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3249 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 168890906, 147478, 36864, 0, 0 ] + } +, "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": +[ 3254 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3254 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3255 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3255 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1225 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1189, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1226 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1197, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1227 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1226, 1227, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.10/self_attn/Concat_1_output_0", "outputIndexes": +[ 1228 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1225, 1228 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1229 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1229 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 169075248, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.10/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1231 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1231, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_2_output_0", "outputIndexes": +[ 1232 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1231 ] +, "main_type": "NONE", "name": "/blocks.10/self_attn/Shape_3_output_0", "outputIndexes": +[ 1233 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1233 ] +, "main_type": "NONE", "name": "Shape4460", "outputIndexes": +[ 1234 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1233 ] +, "main_type": "NONE", "name": "Rank4462", "outputIndexes": +[ 1235 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1235, 1235 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4464", "outputIndexes": +[ 1236 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1236 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4465", "outputIndexes": +[ 1237 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1236, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4467", "outputIndexes": +[ 1238 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1238 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4468", "outputIndexes": +[ 1239 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1234, 1237, 1239, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4471", "outputIndexes": +[ 1240 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1240 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4472", "outputIndexes": +[ 1241 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1241 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4473", "outputIndexes": +[ 1242 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1242, 1241 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4474", "outputIndexes": +[ 1243 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1233, 1243, 1236 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.10/self_attn/Gather_3_output_0", "outputIndexes": +[ 1244 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1244, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Div_1_output_0", "outputIndexes": +[ 1245 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1245, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1246 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1231, 1246, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_3_output_0", "outputIndexes": +[ 1247 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1247 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.10/self_attn/Neg_1_output_0", "outputIndexes": +[ 1248 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1245, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1249 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1231, 24, 1249, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.10/self_attn/Slice_2_output_0", "outputIndexes": +[ 1250 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1248, 1250 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.10/self_attn/Concat_4_output_0", "outputIndexes": +[ 1251 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1251, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Mul_3_output_0", "outputIndexes": +[ 1252 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1232, 1252 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/self_attn/Add_1_output_0", "outputIndexes": +[ 1253 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3249 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 169077296, 147478, 36864, 0, 0 ] + } +, "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": +[ 3258 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3258 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3259 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3259 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1254 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1189, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1255 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1197, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.10/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1256 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1255, 1256, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.10/self_attn/Concat_2_output_0", "outputIndexes": +[ 1257 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1254, 1257 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.10/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1258 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4683", "outputIndexes": +[ 1259 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4686", "outputIndexes": +[ 1260 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1259, 1260, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4689", "outputIndexes": +[ 1261 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1261 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4690", "outputIndexes": +[ 1262 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1262 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4691", "outputIndexes": +[ 1263 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1263, 1262 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4692", "outputIndexes": +[ 1264 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1264, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_21_output_0", "outputIndexes": +[ 1265 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1224, 1253, 1258, 1265 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.10/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1266 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1266 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3260 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3260 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3261 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3261 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 169261638, 589846, 147456, 0, 0 ] + } +, "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": +[ 3262 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3262 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3263 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3263 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1267 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1267 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 169998940, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.10/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1269 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1176, 1269 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/Add_output_0", "outputIndexes": +[ 1270 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1270 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 170008156, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.10/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1271 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1271 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3264 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3264 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3265 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3265 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 170017372, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": +[ 3266 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3266 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3267 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3267 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1272 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1272 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.10/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1273 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1272, 1273 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1274 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1274 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1275 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1272, 1275 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1276 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1276 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1277 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1277 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.10/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1278 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1278 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1279 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1272, 1279 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1280 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1280 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1281 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3265 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 174994034, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": +[ 3270 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3270 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3271 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3271 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1282 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1281, 1282 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/mlp/Mul_output_0", "outputIndexes": +[ 1283 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1283 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3272 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3272 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3273 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3273 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 179970696, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": +[ 3274 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3274 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3275 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3275 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1284 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1284 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 184947358, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.10/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1286 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1270, 1286 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.10/Add_1_output_0", "outputIndexes": +[ 1287 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1287, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/Reshape_output_0", "outputIndexes": +[ 1288 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1288 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 184956574, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.11/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1289 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1289 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3276 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3276 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3277 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3277 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 184965790, 589846, 147456, 0, 0 ] + } +, "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": +[ 3278 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3278 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3279 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3279 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1290 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1289 ] +, "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_output_0", "outputIndexes": +[ 1291 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1291 ] +, "main_type": "NONE", "name": "Shape4843", "outputIndexes": +[ 1292 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1291 ] +, "main_type": "NONE", "name": "Rank4845", "outputIndexes": +[ 1293 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1293, 1293 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4847", "outputIndexes": +[ 1294 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1294 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4848", "outputIndexes": +[ 1295 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1294, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4850", "outputIndexes": +[ 1296 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1296 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4851", "outputIndexes": +[ 1297 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1292, 1295, 1297, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4854", "outputIndexes": +[ 1298 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1298 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4855", "outputIndexes": +[ 1299 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1299, 1299 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4857", "outputIndexes": +[ 1300 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1291, 1300, 1294 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_output_0", "outputIndexes": +[ 1301 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1301, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1302 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1294 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4865", "outputIndexes": +[ 1303 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1296 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4868", "outputIndexes": +[ 1304 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1292, 1303, 1304, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4871", "outputIndexes": +[ 1305 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1305 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4872", "outputIndexes": +[ 1306 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1306 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4873", "outputIndexes": +[ 1307 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1307, 1306 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4874", "outputIndexes": +[ 1308 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1291, 1308, 1294 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_1_output_0", "outputIndexes": +[ 1309 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1309, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1310 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1302, 1310, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.11/self_attn/Concat_output_0", "outputIndexes": +[ 1311 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1290, 1311 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/self_attn/Reshape_output_0", "outputIndexes": +[ 1312 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1312 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 185703092, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.11/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1314 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1314, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_output_0", "outputIndexes": +[ 1315 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1314 ] +, "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_2_output_0", "outputIndexes": +[ 1316 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1316 ] +, "main_type": "NONE", "name": "Shape4992", "outputIndexes": +[ 1317 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1316 ] +, "main_type": "NONE", "name": "Rank4994", "outputIndexes": +[ 1318 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1318, 1318 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4996", "outputIndexes": +[ 1319 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1319 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4997", "outputIndexes": +[ 1320 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1319, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4999", "outputIndexes": +[ 1321 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1321 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5000", "outputIndexes": +[ 1322 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1317, 1320, 1322, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5003", "outputIndexes": +[ 1323 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1323 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5004", "outputIndexes": +[ 1324 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1324 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5005", "outputIndexes": +[ 1325 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1325, 1324 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5006", "outputIndexes": +[ 1326 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1316, 1326, 1319 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_2_output_0", "outputIndexes": +[ 1327 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1327, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Div_output_0", "outputIndexes": +[ 1328 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1328, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1329 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1314, 1329, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_1_output_0", "outputIndexes": +[ 1330 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1330 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.11/self_attn/Neg_output_0", "outputIndexes": +[ 1331 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1328, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1332 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1314, 24, 1332, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_output_0", "outputIndexes": +[ 1333 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1331, 1333 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.11/self_attn/Concat_3_output_0", "outputIndexes": +[ 1334 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1334, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_1_output_0", "outputIndexes": +[ 1335 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1315, 1335 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Add_output_0", "outputIndexes": +[ 1336 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3277 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 185705140, 147478, 36864, 0, 0 ] + } +, "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": +[ 3282 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3282 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3283 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3283 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1337 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1301, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1338 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1309, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1339 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1338, 1339, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.11/self_attn/Concat_1_output_0", "outputIndexes": +[ 1340 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1337, 1340 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1341 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1341 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 185889482, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.11/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1343 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_2_output_0", "outputIndexes": +[ 1344 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343 ] +, "main_type": "NONE", "name": "/blocks.11/self_attn/Shape_3_output_0", "outputIndexes": +[ 1345 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1345 ] +, "main_type": "NONE", "name": "Shape4890", "outputIndexes": +[ 1346 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1345 ] +, "main_type": "NONE", "name": "Rank4892", "outputIndexes": +[ 1347 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1347, 1347 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4894", "outputIndexes": +[ 1348 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1348 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4895", "outputIndexes": +[ 1349 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1348, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4897", "outputIndexes": +[ 1350 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1350 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze4898", "outputIndexes": +[ 1351 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1346, 1349, 1351, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice4901", "outputIndexes": +[ 1352 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1352 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze4902", "outputIndexes": +[ 1353 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1353 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4903", "outputIndexes": +[ 1354 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1354, 1353 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp4904", "outputIndexes": +[ 1355 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1345, 1355, 1348 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.11/self_attn/Gather_3_output_0", "outputIndexes": +[ 1356 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1356, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Div_1_output_0", "outputIndexes": +[ 1357 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1357, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1358 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343, 1358, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_3_output_0", "outputIndexes": +[ 1359 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1359 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.11/self_attn/Neg_1_output_0", "outputIndexes": +[ 1360 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1357, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1361 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1343, 24, 1361, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.11/self_attn/Slice_2_output_0", "outputIndexes": +[ 1362 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1360, 1362 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.11/self_attn/Concat_4_output_0", "outputIndexes": +[ 1363 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1363, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Mul_3_output_0", "outputIndexes": +[ 1364 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1344, 1364 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/self_attn/Add_1_output_0", "outputIndexes": +[ 1365 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3277 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 185891530, 147478, 36864, 0, 0 ] + } +, "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": +[ 3286 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3286 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3287 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3287 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1366 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1301, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1367 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1309, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.11/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1368 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1367, 1368, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.11/self_attn/Concat_2_output_0", "outputIndexes": +[ 1369 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1366, 1369 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.11/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1370 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5113", "outputIndexes": +[ 1371 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5116", "outputIndexes": +[ 1372 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1371, 1372, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5119", "outputIndexes": +[ 1373 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1373 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5120", "outputIndexes": +[ 1374 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1374, 1374 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5122", "outputIndexes": +[ 1375 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1375, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_23_output_0", "outputIndexes": +[ 1376 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1336, 1365, 1370, 1376 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.11/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1377 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1377 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3288 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3288 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3289 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3289 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 186075872, 589846, 147456, 0, 0 ] + } +, "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": +[ 3290 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3290 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3291 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3291 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1378 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1378 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 186813174, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.11/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1380 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1288, 1380 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/Add_output_0", "outputIndexes": +[ 1381 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1381 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 186822390, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.11/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1382 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1382 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3292 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3292 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3293 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3293 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 186831606, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": +[ 3294 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3294 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3295 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3295 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1383 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1383 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.11/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1384 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1383, 1384 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1385 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1385 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1386 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1383, 1386 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1387 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1387 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1388 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1388 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.11/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1389 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1389 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1390 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1383, 1390 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1391 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1391 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1392 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3293 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 191808268, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": +[ 3298 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3298 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3299 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3299 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1393 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1392, 1393 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/mlp/Mul_output_0", "outputIndexes": +[ 1394 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1394 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3300 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3300 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3301 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3301 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 196784930, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": +[ 3302 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3302 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3303 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3303 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1395 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1395 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 201761592, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.11/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1397 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1381, 1397 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.11/Add_1_output_0", "outputIndexes": +[ 1398 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1398, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/Reshape_output_0", "outputIndexes": +[ 1399 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1399 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 201770808, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.12/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1400 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1400 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3304 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3304 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3305 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3305 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 201780024, 589846, 147456, 0, 0 ] + } +, "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": +[ 3306 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3306 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3307 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3307 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1401 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1400 ] +, "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_output_0", "outputIndexes": +[ 1402 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1402 ] +, "main_type": "NONE", "name": "Shape5273", "outputIndexes": +[ 1403 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1402 ] +, "main_type": "NONE", "name": "Rank5275", "outputIndexes": +[ 1404 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1404, 1404 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5277", "outputIndexes": +[ 1405 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5278", "outputIndexes": +[ 1406 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5280", "outputIndexes": +[ 1407 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1407 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5281", "outputIndexes": +[ 1408 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1403, 1406, 1408, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5284", "outputIndexes": +[ 1409 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1409 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5285", "outputIndexes": +[ 1410 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1410, 1410 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5287", "outputIndexes": +[ 1411 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1402, 1411, 1405 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_output_0", "outputIndexes": +[ 1412 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1412, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1413 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1405 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5295", "outputIndexes": +[ 1414 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1407 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5298", "outputIndexes": +[ 1415 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1403, 1414, 1415, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5301", "outputIndexes": +[ 1416 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1416 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5302", "outputIndexes": +[ 1417 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1417 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5303", "outputIndexes": +[ 1418 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1418, 1417 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5304", "outputIndexes": +[ 1419 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1402, 1419, 1405 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_1_output_0", "outputIndexes": +[ 1420 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1420, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1421 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1413, 1421, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.12/self_attn/Concat_output_0", "outputIndexes": +[ 1422 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1401, 1422 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/self_attn/Reshape_output_0", "outputIndexes": +[ 1423 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1423 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 202517326, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.12/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1425 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1425, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_output_0", "outputIndexes": +[ 1426 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1425 ] +, "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_2_output_0", "outputIndexes": +[ 1427 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1427 ] +, "main_type": "NONE", "name": "Shape5422", "outputIndexes": +[ 1428 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1427 ] +, "main_type": "NONE", "name": "Rank5424", "outputIndexes": +[ 1429 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1429, 1429 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5426", "outputIndexes": +[ 1430 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1430 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5427", "outputIndexes": +[ 1431 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1430, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5429", "outputIndexes": +[ 1432 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1432 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5430", "outputIndexes": +[ 1433 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1428, 1431, 1433, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5433", "outputIndexes": +[ 1434 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1434 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5434", "outputIndexes": +[ 1435 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1435 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5435", "outputIndexes": +[ 1436 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1436, 1435 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5436", "outputIndexes": +[ 1437 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1427, 1437, 1430 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_2_output_0", "outputIndexes": +[ 1438 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1438, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Div_output_0", "outputIndexes": +[ 1439 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1439, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1440 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1425, 1440, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_1_output_0", "outputIndexes": +[ 1441 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1441 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.12/self_attn/Neg_output_0", "outputIndexes": +[ 1442 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1439, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1443 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1425, 24, 1443, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_output_0", "outputIndexes": +[ 1444 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1442, 1444 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.12/self_attn/Concat_3_output_0", "outputIndexes": +[ 1445 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1445, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_1_output_0", "outputIndexes": +[ 1446 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1426, 1446 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Add_output_0", "outputIndexes": +[ 1447 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3305 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 202519374, 147478, 36864, 0, 0 ] + } +, "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": +[ 3310 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3310 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3311 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3311 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1448 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1412, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1449 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1420, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1450 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1449, 1450, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.12/self_attn/Concat_1_output_0", "outputIndexes": +[ 1451 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1448, 1451 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1452 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1452 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 202703716, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.12/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1454 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1454, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_2_output_0", "outputIndexes": +[ 1455 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1454 ] +, "main_type": "NONE", "name": "/blocks.12/self_attn/Shape_3_output_0", "outputIndexes": +[ 1456 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1456 ] +, "main_type": "NONE", "name": "Shape5320", "outputIndexes": +[ 1457 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1456 ] +, "main_type": "NONE", "name": "Rank5322", "outputIndexes": +[ 1458 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1458, 1458 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5324", "outputIndexes": +[ 1459 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1459 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5325", "outputIndexes": +[ 1460 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1459, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5327", "outputIndexes": +[ 1461 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1461 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5328", "outputIndexes": +[ 1462 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1457, 1460, 1462, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5331", "outputIndexes": +[ 1463 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1463 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5332", "outputIndexes": +[ 1464 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1464 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5333", "outputIndexes": +[ 1465 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1465, 1464 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5334", "outputIndexes": +[ 1466 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1456, 1466, 1459 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.12/self_attn/Gather_3_output_0", "outputIndexes": +[ 1467 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1467, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Div_1_output_0", "outputIndexes": +[ 1468 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1468, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1469 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1454, 1469, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_3_output_0", "outputIndexes": +[ 1470 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1470 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.12/self_attn/Neg_1_output_0", "outputIndexes": +[ 1471 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1468, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1472 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1454, 24, 1472, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.12/self_attn/Slice_2_output_0", "outputIndexes": +[ 1473 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1471, 1473 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.12/self_attn/Concat_4_output_0", "outputIndexes": +[ 1474 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1474, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Mul_3_output_0", "outputIndexes": +[ 1475 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1455, 1475 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/self_attn/Add_1_output_0", "outputIndexes": +[ 1476 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3305 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 202705764, 147478, 36864, 0, 0 ] + } +, "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": +[ 3314 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3314 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3315 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3315 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1477 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1412, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1478 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1420, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.12/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1479 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1478, 1479, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.12/self_attn/Concat_2_output_0", "outputIndexes": +[ 1480 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1477, 1480 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.12/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1481 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5543", "outputIndexes": +[ 1482 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5546", "outputIndexes": +[ 1483 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1482, 1483, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5549", "outputIndexes": +[ 1484 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1484 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5550", "outputIndexes": +[ 1485 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1485 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5551", "outputIndexes": +[ 1486 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1486, 1485 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5552", "outputIndexes": +[ 1487 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1487, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_25_output_0", "outputIndexes": +[ 1488 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1447, 1476, 1481, 1488 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.12/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1489 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1489 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3316 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3316 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3317 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3317 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 202890106, 589846, 147456, 0, 0 ] + } +, "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": +[ 3318 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3318 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3319 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3319 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1490 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1490 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 203627408, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.12/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1492 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1399, 1492 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/Add_output_0", "outputIndexes": +[ 1493 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1493 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 203636624, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.12/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1494 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1494 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3320 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3320 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3321 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3321 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 203645840, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": +[ 3322 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3322 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3323 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3323 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1495 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1495 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.12/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1496 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1495, 1496 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1497 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1497 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1498 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1495, 1498 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1499 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1499 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1500 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1500 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.12/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1501 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1501 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1502 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1495, 1502 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1503 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1503 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1504 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3321 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 208622502, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": +[ 3326 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3326 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3327 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3327 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1505 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1504, 1505 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/mlp/Mul_output_0", "outputIndexes": +[ 1506 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1506 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3328 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3328 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3329 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3329 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 213599164, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": +[ 3330 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3330 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3331 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3331 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1507 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1507 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 218575826, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.12/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1509 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1493, 1509 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.12/Add_1_output_0", "outputIndexes": +[ 1510 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1510, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/Reshape_output_0", "outputIndexes": +[ 1511 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1511 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 218585042, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.13/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1512 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1512 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3332 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3332 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3333 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3333 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 218594258, 589846, 147456, 0, 0 ] + } +, "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": +[ 3334 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3334 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3335 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3335 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1513 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1512 ] +, "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_output_0", "outputIndexes": +[ 1514 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1514 ] +, "main_type": "NONE", "name": "Shape5703", "outputIndexes": +[ 1515 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1514 ] +, "main_type": "NONE", "name": "Rank5705", "outputIndexes": +[ 1516 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1516, 1516 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5707", "outputIndexes": +[ 1517 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1517 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5708", "outputIndexes": +[ 1518 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1517, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5710", "outputIndexes": +[ 1519 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1519 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5711", "outputIndexes": +[ 1520 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1515, 1518, 1520, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5714", "outputIndexes": +[ 1521 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1521 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5715", "outputIndexes": +[ 1522 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1522, 1522 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5717", "outputIndexes": +[ 1523 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1514, 1523, 1517 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_output_0", "outputIndexes": +[ 1524 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1524, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1525 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1517 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5725", "outputIndexes": +[ 1526 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1519 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5728", "outputIndexes": +[ 1527 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1515, 1526, 1527, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5731", "outputIndexes": +[ 1528 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1528 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5732", "outputIndexes": +[ 1529 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1529 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5733", "outputIndexes": +[ 1530 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1530, 1529 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5734", "outputIndexes": +[ 1531 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1514, 1531, 1517 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_1_output_0", "outputIndexes": +[ 1532 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1532, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1533 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1525, 1533, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.13/self_attn/Concat_output_0", "outputIndexes": +[ 1534 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1513, 1534 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/self_attn/Reshape_output_0", "outputIndexes": +[ 1535 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1535 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 219331560, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.13/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1537 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1537, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_output_0", "outputIndexes": +[ 1538 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1537 ] +, "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_2_output_0", "outputIndexes": +[ 1539 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1539 ] +, "main_type": "NONE", "name": "Shape5852", "outputIndexes": +[ 1540 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1539 ] +, "main_type": "NONE", "name": "Rank5854", "outputIndexes": +[ 1541 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1541, 1541 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5856", "outputIndexes": +[ 1542 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1542 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5857", "outputIndexes": +[ 1543 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1542, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5859", "outputIndexes": +[ 1544 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1544 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5860", "outputIndexes": +[ 1545 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1540, 1543, 1545, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5863", "outputIndexes": +[ 1546 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1546 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5864", "outputIndexes": +[ 1547 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1547 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5865", "outputIndexes": +[ 1548 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1548, 1547 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5866", "outputIndexes": +[ 1549 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1539, 1549, 1542 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_2_output_0", "outputIndexes": +[ 1550 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1550, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Div_output_0", "outputIndexes": +[ 1551 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1551, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1552 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1537, 1552, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_1_output_0", "outputIndexes": +[ 1553 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1553 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.13/self_attn/Neg_output_0", "outputIndexes": +[ 1554 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1551, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1555 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1537, 24, 1555, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_output_0", "outputIndexes": +[ 1556 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1554, 1556 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.13/self_attn/Concat_3_output_0", "outputIndexes": +[ 1557 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1557, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_1_output_0", "outputIndexes": +[ 1558 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1538, 1558 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Add_output_0", "outputIndexes": +[ 1559 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3333 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 219333608, 147478, 36864, 0, 0 ] + } +, "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": +[ 3338 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3338 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3339 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3339 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1560 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1524, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1561 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1532, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1562 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1561, 1562, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.13/self_attn/Concat_1_output_0", "outputIndexes": +[ 1563 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1560, 1563 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1564 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1564 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 219517950, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.13/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1566 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1566, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_2_output_0", "outputIndexes": +[ 1567 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1566 ] +, "main_type": "NONE", "name": "/blocks.13/self_attn/Shape_3_output_0", "outputIndexes": +[ 1568 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1568 ] +, "main_type": "NONE", "name": "Shape5750", "outputIndexes": +[ 1569 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1568 ] +, "main_type": "NONE", "name": "Rank5752", "outputIndexes": +[ 1570 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1570, 1570 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5754", "outputIndexes": +[ 1571 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1571 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5755", "outputIndexes": +[ 1572 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1571, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5757", "outputIndexes": +[ 1573 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1573 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5758", "outputIndexes": +[ 1574 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1569, 1572, 1574, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5761", "outputIndexes": +[ 1575 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1575 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5762", "outputIndexes": +[ 1576 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1576 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5763", "outputIndexes": +[ 1577 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1577, 1576 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5764", "outputIndexes": +[ 1578 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1568, 1578, 1571 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.13/self_attn/Gather_3_output_0", "outputIndexes": +[ 1579 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1579, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Div_1_output_0", "outputIndexes": +[ 1580 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1580, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1581 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1566, 1581, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_3_output_0", "outputIndexes": +[ 1582 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1582 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.13/self_attn/Neg_1_output_0", "outputIndexes": +[ 1583 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1580, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1584 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1566, 24, 1584, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.13/self_attn/Slice_2_output_0", "outputIndexes": +[ 1585 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1583, 1585 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.13/self_attn/Concat_4_output_0", "outputIndexes": +[ 1586 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1586, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Mul_3_output_0", "outputIndexes": +[ 1587 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1567, 1587 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/self_attn/Add_1_output_0", "outputIndexes": +[ 1588 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3333 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 219519998, 147478, 36864, 0, 0 ] + } +, "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": +[ 3342 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3342 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3343 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3343 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1589 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1524, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1590 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1532, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.13/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1591 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1590, 1591, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.13/self_attn/Concat_2_output_0", "outputIndexes": +[ 1592 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1589, 1592 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.13/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1593 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5973", "outputIndexes": +[ 1594 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze5976", "outputIndexes": +[ 1595 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1594, 1595, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice5979", "outputIndexes": +[ 1596 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1596 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze5980", "outputIndexes": +[ 1597 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1597 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5981", "outputIndexes": +[ 1598 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1598, 1597 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp5982", "outputIndexes": +[ 1599 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1599, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_27_output_0", "outputIndexes": +[ 1600 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1559, 1588, 1593, 1600 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.13/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1601 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1601 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3344 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3344 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3345 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3345 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 219704340, 589846, 147456, 0, 0 ] + } +, "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": +[ 3346 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3346 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3347 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3347 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1602 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1602 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 220441642, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.13/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1604 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1511, 1604 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/Add_output_0", "outputIndexes": +[ 1605 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1605 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 220450858, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.13/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1606 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1606 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3348 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3348 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3349 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3349 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 220460074, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": +[ 3350 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3350 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3351 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3351 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1607 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1607 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.13/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1608 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1607, 1608 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1609 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1609 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1610 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1607, 1610 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1611 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1611 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1612 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1612 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.13/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1613 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1613 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1614 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1607, 1614 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1615 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1615 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1616 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3349 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 225436736, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": +[ 3354 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3354 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3355 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3355 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1617 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1616, 1617 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/mlp/Mul_output_0", "outputIndexes": +[ 1618 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1618 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3356 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3356 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3357 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3357 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 230413398, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": +[ 3358 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3358 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3359 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3359 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1619 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1619 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 235390060, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.13/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1621 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1605, 1621 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.13/Add_1_output_0", "outputIndexes": +[ 1622 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1622, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/Reshape_output_0", "outputIndexes": +[ 1623 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1623 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 235399276, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.14/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1624 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1624 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3360 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3360 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3361 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3361 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 235408492, 589846, 147456, 0, 0 ] + } +, "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": +[ 3362 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3362 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3363 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3363 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1625 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1624 ] +, "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_output_0", "outputIndexes": +[ 1626 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1626 ] +, "main_type": "NONE", "name": "Shape6133", "outputIndexes": +[ 1627 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1626 ] +, "main_type": "NONE", "name": "Rank6135", "outputIndexes": +[ 1628 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1628, 1628 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6137", "outputIndexes": +[ 1629 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1629 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6138", "outputIndexes": +[ 1630 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1629, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6140", "outputIndexes": +[ 1631 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1631 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6141", "outputIndexes": +[ 1632 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1627, 1630, 1632, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6144", "outputIndexes": +[ 1633 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1633 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6145", "outputIndexes": +[ 1634 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1634, 1634 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6147", "outputIndexes": +[ 1635 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1626, 1635, 1629 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_output_0", "outputIndexes": +[ 1636 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1636, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1637 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1629 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6155", "outputIndexes": +[ 1638 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1631 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6158", "outputIndexes": +[ 1639 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1627, 1638, 1639, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6161", "outputIndexes": +[ 1640 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1640 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6162", "outputIndexes": +[ 1641 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1641 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6163", "outputIndexes": +[ 1642 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1642, 1641 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6164", "outputIndexes": +[ 1643 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1626, 1643, 1629 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_1_output_0", "outputIndexes": +[ 1644 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1644, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1645 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1637, 1645, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.14/self_attn/Concat_output_0", "outputIndexes": +[ 1646 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1625, 1646 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/self_attn/Reshape_output_0", "outputIndexes": +[ 1647 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1647 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 236145794, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.14/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1649 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1649, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_output_0", "outputIndexes": +[ 1650 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1649 ] +, "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_2_output_0", "outputIndexes": +[ 1651 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1651 ] +, "main_type": "NONE", "name": "Shape6282", "outputIndexes": +[ 1652 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1651 ] +, "main_type": "NONE", "name": "Rank6284", "outputIndexes": +[ 1653 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1653, 1653 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6286", "outputIndexes": +[ 1654 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1654 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6287", "outputIndexes": +[ 1655 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1654, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6289", "outputIndexes": +[ 1656 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1656 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6290", "outputIndexes": +[ 1657 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1652, 1655, 1657, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6293", "outputIndexes": +[ 1658 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1658 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6294", "outputIndexes": +[ 1659 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1659 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6295", "outputIndexes": +[ 1660 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1660, 1659 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6296", "outputIndexes": +[ 1661 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1651, 1661, 1654 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_2_output_0", "outputIndexes": +[ 1662 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1662, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Div_output_0", "outputIndexes": +[ 1663 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1663, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1664 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1649, 1664, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_1_output_0", "outputIndexes": +[ 1665 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1665 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.14/self_attn/Neg_output_0", "outputIndexes": +[ 1666 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1663, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1667 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1649, 24, 1667, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_output_0", "outputIndexes": +[ 1668 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1666, 1668 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.14/self_attn/Concat_3_output_0", "outputIndexes": +[ 1669 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1669, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_1_output_0", "outputIndexes": +[ 1670 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1650, 1670 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Add_output_0", "outputIndexes": +[ 1671 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3361 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 236147842, 147478, 36864, 0, 0 ] + } +, "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": +[ 3366 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3366 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3367 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3367 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1672 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1636, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1673 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1644, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1674 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1673, 1674, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.14/self_attn/Concat_1_output_0", "outputIndexes": +[ 1675 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1672, 1675 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1676 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1676 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 236332184, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.14/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1678 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1678, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_2_output_0", "outputIndexes": +[ 1679 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1678 ] +, "main_type": "NONE", "name": "/blocks.14/self_attn/Shape_3_output_0", "outputIndexes": +[ 1680 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1680 ] +, "main_type": "NONE", "name": "Shape6180", "outputIndexes": +[ 1681 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1680 ] +, "main_type": "NONE", "name": "Rank6182", "outputIndexes": +[ 1682 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1682, 1682 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6184", "outputIndexes": +[ 1683 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1683 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6185", "outputIndexes": +[ 1684 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1683, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6187", "outputIndexes": +[ 1685 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1685 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6188", "outputIndexes": +[ 1686 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1681, 1684, 1686, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6191", "outputIndexes": +[ 1687 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1687 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6192", "outputIndexes": +[ 1688 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1688 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6193", "outputIndexes": +[ 1689 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1689, 1688 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6194", "outputIndexes": +[ 1690 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1680, 1690, 1683 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.14/self_attn/Gather_3_output_0", "outputIndexes": +[ 1691 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1691, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Div_1_output_0", "outputIndexes": +[ 1692 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1692, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1693 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1678, 1693, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_3_output_0", "outputIndexes": +[ 1694 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1694 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.14/self_attn/Neg_1_output_0", "outputIndexes": +[ 1695 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1692, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1696 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1678, 24, 1696, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.14/self_attn/Slice_2_output_0", "outputIndexes": +[ 1697 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1695, 1697 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.14/self_attn/Concat_4_output_0", "outputIndexes": +[ 1698 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1698, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Mul_3_output_0", "outputIndexes": +[ 1699 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1679, 1699 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/self_attn/Add_1_output_0", "outputIndexes": +[ 1700 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3361 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 236334232, 147478, 36864, 0, 0 ] + } +, "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": +[ 3370 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3370 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3371 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3371 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1701 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1636, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1702 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1644, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.14/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1703 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1702, 1703, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.14/self_attn/Concat_2_output_0", "outputIndexes": +[ 1704 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1701, 1704 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.14/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1705 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6403", "outputIndexes": +[ 1706 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6406", "outputIndexes": +[ 1707 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1706, 1707, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6409", "outputIndexes": +[ 1708 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1708 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6410", "outputIndexes": +[ 1709 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1709 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6411", "outputIndexes": +[ 1710 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1710, 1709 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6412", "outputIndexes": +[ 1711 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1711, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_29_output_0", "outputIndexes": +[ 1712 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1671, 1700, 1705, 1712 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.14/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1713 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1713 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3372 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3372 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3373 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3373 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 236518574, 589846, 147456, 0, 0 ] + } +, "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": +[ 3374 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3374 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3375 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3375 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1714 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1714 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 237255876, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.14/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1716 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1623, 1716 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/Add_output_0", "outputIndexes": +[ 1717 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1717 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 237265092, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.14/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1718 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1718 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3376 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3376 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3377 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3377 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 237274308, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": +[ 3378 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3378 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3379 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3379 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1719 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1719 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.14/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1720 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1719, 1720 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1721 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1721 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1722 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1719, 1722 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1723 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1723 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1724 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1724 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.14/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1725 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1725 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1726 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1719, 1726 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1727 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1727 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1728 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3377 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 242250970, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": +[ 3382 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3382 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3383 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3383 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1729 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1728, 1729 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/mlp/Mul_output_0", "outputIndexes": +[ 1730 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1730 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3384 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3384 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3385 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3385 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 247227632, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": +[ 3386 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3386 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3387 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3387 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1731 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1731 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 252204294, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.14/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1733 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1717, 1733 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.14/Add_1_output_0", "outputIndexes": +[ 1734 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1734, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/Reshape_output_0", "outputIndexes": +[ 1735 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1735 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 252213510, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.15/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1736 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1736 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3388 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3388 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3389 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3389 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 252222726, 589846, 147456, 0, 0 ] + } +, "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": +[ 3390 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3390 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3391 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3391 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1737 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1736 ] +, "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_output_0", "outputIndexes": +[ 1738 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1738 ] +, "main_type": "NONE", "name": "Shape6563", "outputIndexes": +[ 1739 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1738 ] +, "main_type": "NONE", "name": "Rank6565", "outputIndexes": +[ 1740 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1740, 1740 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6567", "outputIndexes": +[ 1741 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1741 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6568", "outputIndexes": +[ 1742 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1741, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6570", "outputIndexes": +[ 1743 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1743 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6571", "outputIndexes": +[ 1744 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1739, 1742, 1744, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6574", "outputIndexes": +[ 1745 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1745 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6575", "outputIndexes": +[ 1746 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1746, 1746 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6577", "outputIndexes": +[ 1747 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1738, 1747, 1741 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_output_0", "outputIndexes": +[ 1748 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1748, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1749 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1741 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6585", "outputIndexes": +[ 1750 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1743 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6588", "outputIndexes": +[ 1751 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1739, 1750, 1751, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6591", "outputIndexes": +[ 1752 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1752 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6592", "outputIndexes": +[ 1753 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1753 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6593", "outputIndexes": +[ 1754 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1754, 1753 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6594", "outputIndexes": +[ 1755 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1738, 1755, 1741 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_1_output_0", "outputIndexes": +[ 1756 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1756, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1757 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1749, 1757, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.15/self_attn/Concat_output_0", "outputIndexes": +[ 1758 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1737, 1758 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/self_attn/Reshape_output_0", "outputIndexes": +[ 1759 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1759 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 252960028, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.15/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1761 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_output_0", "outputIndexes": +[ 1762 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761 ] +, "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_2_output_0", "outputIndexes": +[ 1763 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1763 ] +, "main_type": "NONE", "name": "Shape6712", "outputIndexes": +[ 1764 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1763 ] +, "main_type": "NONE", "name": "Rank6714", "outputIndexes": +[ 1765 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1765, 1765 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6716", "outputIndexes": +[ 1766 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1766 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6717", "outputIndexes": +[ 1767 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1766, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6719", "outputIndexes": +[ 1768 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1768 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6720", "outputIndexes": +[ 1769 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1764, 1767, 1769, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6723", "outputIndexes": +[ 1770 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1770 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6724", "outputIndexes": +[ 1771 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1771 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6725", "outputIndexes": +[ 1772 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1772, 1771 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6726", "outputIndexes": +[ 1773 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1763, 1773, 1766 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_2_output_0", "outputIndexes": +[ 1774 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1774, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Div_output_0", "outputIndexes": +[ 1775 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1775, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1776 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761, 1776, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_1_output_0", "outputIndexes": +[ 1777 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1777 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.15/self_attn/Neg_output_0", "outputIndexes": +[ 1778 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1775, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1779 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1761, 24, 1779, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_output_0", "outputIndexes": +[ 1780 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1778, 1780 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.15/self_attn/Concat_3_output_0", "outputIndexes": +[ 1781 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1781, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_1_output_0", "outputIndexes": +[ 1782 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1762, 1782 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Add_output_0", "outputIndexes": +[ 1783 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3389 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 252962076, 147478, 36864, 0, 0 ] + } +, "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": +[ 3394 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3394 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3395 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3395 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1784 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1748, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1785 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1756, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1786 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1785, 1786, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.15/self_attn/Concat_1_output_0", "outputIndexes": +[ 1787 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1784, 1787 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1788 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1788 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 253146418, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.15/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1790 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1790, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_2_output_0", "outputIndexes": +[ 1791 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1790 ] +, "main_type": "NONE", "name": "/blocks.15/self_attn/Shape_3_output_0", "outputIndexes": +[ 1792 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1792 ] +, "main_type": "NONE", "name": "Shape6610", "outputIndexes": +[ 1793 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1792 ] +, "main_type": "NONE", "name": "Rank6612", "outputIndexes": +[ 1794 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1794, 1794 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6614", "outputIndexes": +[ 1795 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1795 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6615", "outputIndexes": +[ 1796 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1795, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6617", "outputIndexes": +[ 1797 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1797 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6618", "outputIndexes": +[ 1798 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1793, 1796, 1798, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6621", "outputIndexes": +[ 1799 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1799 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6622", "outputIndexes": +[ 1800 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1800 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6623", "outputIndexes": +[ 1801 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1801, 1800 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6624", "outputIndexes": +[ 1802 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1792, 1802, 1795 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.15/self_attn/Gather_3_output_0", "outputIndexes": +[ 1803 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1803, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Div_1_output_0", "outputIndexes": +[ 1804 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1804, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1805 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1790, 1805, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_3_output_0", "outputIndexes": +[ 1806 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1806 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.15/self_attn/Neg_1_output_0", "outputIndexes": +[ 1807 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1804, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1808 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1790, 24, 1808, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.15/self_attn/Slice_2_output_0", "outputIndexes": +[ 1809 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1807, 1809 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.15/self_attn/Concat_4_output_0", "outputIndexes": +[ 1810 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1810, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Mul_3_output_0", "outputIndexes": +[ 1811 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1791, 1811 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/self_attn/Add_1_output_0", "outputIndexes": +[ 1812 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3389 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 253148466, 147478, 36864, 0, 0 ] + } +, "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": +[ 3398 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3398 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3399 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3399 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1813 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1748, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1814 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1756, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.15/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1815 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1814, 1815, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.15/self_attn/Concat_2_output_0", "outputIndexes": +[ 1816 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1813, 1816 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.15/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1817 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6833", "outputIndexes": +[ 1818 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6836", "outputIndexes": +[ 1819 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1818, 1819, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice6839", "outputIndexes": +[ 1820 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1820 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze6840", "outputIndexes": +[ 1821 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1821 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6841", "outputIndexes": +[ 1822 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1822, 1821 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6842", "outputIndexes": +[ 1823 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1823, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_31_output_0", "outputIndexes": +[ 1824 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1783, 1812, 1817, 1824 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.15/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1825 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1825 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3400 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3400 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3401 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3401 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 253332808, 589846, 147456, 0, 0 ] + } +, "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": +[ 3402 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3402 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3403 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3403 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1826 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1826 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 254070110, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.15/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1828 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1735, 1828 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/Add_output_0", "outputIndexes": +[ 1829 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1829 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 254079326, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.15/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1830 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1830 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3404 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3404 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3405 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3405 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 254088542, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": +[ 3406 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3406 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3407 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3407 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1831 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1831 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.15/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1832 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1831, 1832 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1833 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1833 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1834 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1831, 1834 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1835 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1835 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1836 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1836 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.15/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1837 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1837 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1838 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1831, 1838 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1839 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1839 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1840 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3405 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 259065204, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": +[ 3410 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3410 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3411 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3411 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1841 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1840, 1841 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/mlp/Mul_output_0", "outputIndexes": +[ 1842 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1842 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3412 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3412 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3413 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3413 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 264041866, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": +[ 3414 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3414 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3415 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3415 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1843 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1843 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 269018528, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.15/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1845 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1829, 1845 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.15/Add_1_output_0", "outputIndexes": +[ 1846 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1846, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/Reshape_output_0", "outputIndexes": +[ 1847 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1847 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 269027744, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.16/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1848 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1848 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3416 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3416 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3417 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3417 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 269036960, 589846, 147456, 0, 0 ] + } +, "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": +[ 3418 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3418 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3419 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3419 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1849 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1848 ] +, "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_output_0", "outputIndexes": +[ 1850 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1850 ] +, "main_type": "NONE", "name": "Shape6993", "outputIndexes": +[ 1851 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1850 ] +, "main_type": "NONE", "name": "Rank6995", "outputIndexes": +[ 1852 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1852, 1852 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp6997", "outputIndexes": +[ 1853 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1853 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze6998", "outputIndexes": +[ 1854 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1853, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7000", "outputIndexes": +[ 1855 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1855 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7001", "outputIndexes": +[ 1856 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1851, 1854, 1856, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7004", "outputIndexes": +[ 1857 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1857 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7005", "outputIndexes": +[ 1858 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1858, 1858 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7007", "outputIndexes": +[ 1859 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1850, 1859, 1853 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_output_0", "outputIndexes": +[ 1860 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1860, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1861 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1853 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7015", "outputIndexes": +[ 1862 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1855 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7018", "outputIndexes": +[ 1863 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1851, 1862, 1863, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7021", "outputIndexes": +[ 1864 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1864 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7022", "outputIndexes": +[ 1865 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1865 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7023", "outputIndexes": +[ 1866 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1866, 1865 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7024", "outputIndexes": +[ 1867 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1850, 1867, 1853 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_1_output_0", "outputIndexes": +[ 1868 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1868, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1869 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1861, 1869, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.16/self_attn/Concat_output_0", "outputIndexes": +[ 1870 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1849, 1870 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/self_attn/Reshape_output_0", "outputIndexes": +[ 1871 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1871 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 269774262, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.16/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1873 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1873, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_output_0", "outputIndexes": +[ 1874 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1873 ] +, "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_2_output_0", "outputIndexes": +[ 1875 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1875 ] +, "main_type": "NONE", "name": "Shape7142", "outputIndexes": +[ 1876 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1875 ] +, "main_type": "NONE", "name": "Rank7144", "outputIndexes": +[ 1877 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1877, 1877 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7146", "outputIndexes": +[ 1878 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1878 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7147", "outputIndexes": +[ 1879 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1878, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7149", "outputIndexes": +[ 1880 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1880 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7150", "outputIndexes": +[ 1881 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1876, 1879, 1881, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7153", "outputIndexes": +[ 1882 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1882 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7154", "outputIndexes": +[ 1883 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1883 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7155", "outputIndexes": +[ 1884 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1884, 1883 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7156", "outputIndexes": +[ 1885 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1875, 1885, 1878 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_2_output_0", "outputIndexes": +[ 1886 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1886, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Div_output_0", "outputIndexes": +[ 1887 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1887, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 1888 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1873, 1888, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_1_output_0", "outputIndexes": +[ 1889 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1889 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.16/self_attn/Neg_output_0", "outputIndexes": +[ 1890 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1887, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 1891 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1873, 24, 1891, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_output_0", "outputIndexes": +[ 1892 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1890, 1892 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.16/self_attn/Concat_3_output_0", "outputIndexes": +[ 1893 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1893, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_1_output_0", "outputIndexes": +[ 1894 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1874, 1894 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Add_output_0", "outputIndexes": +[ 1895 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3417 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 269776310, 147478, 36864, 0, 0 ] + } +, "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": +[ 3422 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3422 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3423 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3423 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 1896 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1860, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 1897 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1868, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 1898 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1897, 1898, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.16/self_attn/Concat_1_output_0", "outputIndexes": +[ 1899 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1896, 1899 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/self_attn/Reshape_1_output_0", "outputIndexes": +[ 1900 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1900 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 269960652, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.16/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 1902 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1902, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_2_output_0", "outputIndexes": +[ 1903 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1902 ] +, "main_type": "NONE", "name": "/blocks.16/self_attn/Shape_3_output_0", "outputIndexes": +[ 1904 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1904 ] +, "main_type": "NONE", "name": "Shape7040", "outputIndexes": +[ 1905 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1904 ] +, "main_type": "NONE", "name": "Rank7042", "outputIndexes": +[ 1906 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1906, 1906 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7044", "outputIndexes": +[ 1907 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1907 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7045", "outputIndexes": +[ 1908 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1907, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7047", "outputIndexes": +[ 1909 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1909 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7048", "outputIndexes": +[ 1910 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1905, 1908, 1910, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7051", "outputIndexes": +[ 1911 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1911 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7052", "outputIndexes": +[ 1912 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1912 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7053", "outputIndexes": +[ 1913 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1913, 1912 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7054", "outputIndexes": +[ 1914 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1904, 1914, 1907 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.16/self_attn/Gather_3_output_0", "outputIndexes": +[ 1915 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1915, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Div_1_output_0", "outputIndexes": +[ 1916 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1916, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 1917 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1902, 1917, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_3_output_0", "outputIndexes": +[ 1918 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1918 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.16/self_attn/Neg_1_output_0", "outputIndexes": +[ 1919 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1916, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 1920 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1902, 24, 1920, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.16/self_attn/Slice_2_output_0", "outputIndexes": +[ 1921 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1919, 1921 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.16/self_attn/Concat_4_output_0", "outputIndexes": +[ 1922 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1922, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Mul_3_output_0", "outputIndexes": +[ 1923 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1903, 1923 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/self_attn/Add_1_output_0", "outputIndexes": +[ 1924 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3417 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 269962700, 147478, 36864, 0, 0 ] + } +, "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": +[ 3426 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3426 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3427 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3427 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 1925 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1860, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 1926 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1868, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.16/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 1927 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1926, 1927, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.16/self_attn/Concat_2_output_0", "outputIndexes": +[ 1928 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1925, 1928 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.16/self_attn/Reshape_2_output_0", "outputIndexes": +[ 1929 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7263", "outputIndexes": +[ 1930 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7266", "outputIndexes": +[ 1931 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 1930, 1931, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7269", "outputIndexes": +[ 1932 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1932 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7270", "outputIndexes": +[ 1933 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1933 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7271", "outputIndexes": +[ 1934 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1934, 1933 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7272", "outputIndexes": +[ 1935 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 1935, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_33_output_0", "outputIndexes": +[ 1936 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1895, 1924, 1929, 1936 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.16/self_attn/Reshape_7_output_0", "outputIndexes": +[ 1937 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1937 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3428 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3428 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3429 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3429 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 270147042, 589846, 147456, 0, 0 ] + } +, "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": +[ 3430 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3430 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3431 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3431 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 1938 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1938 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 270884344, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.16/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 1940 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1847, 1940 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/Add_output_0", "outputIndexes": +[ 1941 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1941 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 270893560, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.16/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1942 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1942 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3432 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3432 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3433 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3433 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 270902776, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": +[ 3434 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3434 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3435 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3435 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 1943 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1943 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.16/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 1944 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1943, 1944 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 1945 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 1945 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 1946 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1943, 1946 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Add_output_0", "outputIndexes": +[ 1947 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 1947 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 1948 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1948 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.16/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 1949 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 1949 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 1950 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1943, 1950 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 1951 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 1951 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 1952 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3433 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 275879438, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": +[ 3438 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3438 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3439 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3439 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 1953 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1952, 1953 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/mlp/Mul_output_0", "outputIndexes": +[ 1954 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1954 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3440 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3440 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3441 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3441 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 280856100, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": +[ 3442 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3442 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3443 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3443 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 1955 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1955 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 285832762, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.16/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 1957 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1941, 1957 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.16/Add_1_output_0", "outputIndexes": +[ 1958 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1958, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/Reshape_output_0", "outputIndexes": +[ 1959 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1959 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 285841978, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.17/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 1960 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1960 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3444 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3444 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3445 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3445 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 285851194, 589846, 147456, 0, 0 ] + } +, "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": +[ 3446 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3446 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3447 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3447 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 1961 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1960 ] +, "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_output_0", "outputIndexes": +[ 1962 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1962 ] +, "main_type": "NONE", "name": "Shape7423", "outputIndexes": +[ 1963 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1962 ] +, "main_type": "NONE", "name": "Rank7425", "outputIndexes": +[ 1964 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1964, 1964 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7427", "outputIndexes": +[ 1965 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1965 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7428", "outputIndexes": +[ 1966 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1965, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7430", "outputIndexes": +[ 1967 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1967 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7431", "outputIndexes": +[ 1968 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1963, 1966, 1968, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7434", "outputIndexes": +[ 1969 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1969 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7435", "outputIndexes": +[ 1970 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1970, 1970 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7437", "outputIndexes": +[ 1971 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1962, 1971, 1965 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_output_0", "outputIndexes": +[ 1972 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1972, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 1973 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1965 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7445", "outputIndexes": +[ 1974 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1967 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7448", "outputIndexes": +[ 1975 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1963, 1974, 1975, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7451", "outputIndexes": +[ 1976 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1976 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7452", "outputIndexes": +[ 1977 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 1977 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7453", "outputIndexes": +[ 1978 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1978, 1977 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7454", "outputIndexes": +[ 1979 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1962, 1979, 1965 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_1_output_0", "outputIndexes": +[ 1980 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1980, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 1981 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1973, 1981, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.17/self_attn/Concat_output_0", "outputIndexes": +[ 1982 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1961, 1982 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/self_attn/Reshape_output_0", "outputIndexes": +[ 1983 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1983 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 286588496, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.17/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 1985 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1985, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_output_0", "outputIndexes": +[ 1986 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1985 ] +, "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_2_output_0", "outputIndexes": +[ 1987 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1987 ] +, "main_type": "NONE", "name": "Shape7572", "outputIndexes": +[ 1988 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 1987 ] +, "main_type": "NONE", "name": "Rank7574", "outputIndexes": +[ 1989 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1989, 1989 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7576", "outputIndexes": +[ 1990 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1990 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7577", "outputIndexes": +[ 1991 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1990, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7579", "outputIndexes": +[ 1992 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1992 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7580", "outputIndexes": +[ 1993 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1988, 1991, 1993, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7583", "outputIndexes": +[ 1994 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1994 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7584", "outputIndexes": +[ 1995 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 1995 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7585", "outputIndexes": +[ 1996 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1996, 1995 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7586", "outputIndexes": +[ 1997 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1987, 1997, 1990 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_2_output_0", "outputIndexes": +[ 1998 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1998, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Div_output_0", "outputIndexes": +[ 1999 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1999, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2000 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1985, 2000, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_1_output_0", "outputIndexes": +[ 2001 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2001 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.17/self_attn/Neg_output_0", "outputIndexes": +[ 2002 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1999, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2003 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1985, 24, 2003, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_output_0", "outputIndexes": +[ 2004 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2002, 2004 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.17/self_attn/Concat_3_output_0", "outputIndexes": +[ 2005 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2005, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_1_output_0", "outputIndexes": +[ 2006 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1986, 2006 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Add_output_0", "outputIndexes": +[ 2007 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3445 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 286590544, 147478, 36864, 0, 0 ] + } +, "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": +[ 3450 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3450 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3451 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3451 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2008 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1972, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2009 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1980, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2010 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2009, 2010, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.17/self_attn/Concat_1_output_0", "outputIndexes": +[ 2011 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2008, 2011 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2012 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2012 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 286774886, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.17/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2014 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2014, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_2_output_0", "outputIndexes": +[ 2015 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2014 ] +, "main_type": "NONE", "name": "/blocks.17/self_attn/Shape_3_output_0", "outputIndexes": +[ 2016 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2016 ] +, "main_type": "NONE", "name": "Shape7470", "outputIndexes": +[ 2017 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2016 ] +, "main_type": "NONE", "name": "Rank7472", "outputIndexes": +[ 2018 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2018, 2018 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7474", "outputIndexes": +[ 2019 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2019 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7475", "outputIndexes": +[ 2020 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2019, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7477", "outputIndexes": +[ 2021 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2021 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7478", "outputIndexes": +[ 2022 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2017, 2020, 2022, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7481", "outputIndexes": +[ 2023 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2023 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7482", "outputIndexes": +[ 2024 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2024 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7483", "outputIndexes": +[ 2025 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2025, 2024 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7484", "outputIndexes": +[ 2026 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2016, 2026, 2019 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.17/self_attn/Gather_3_output_0", "outputIndexes": +[ 2027 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2027, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Div_1_output_0", "outputIndexes": +[ 2028 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2028, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2029 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2014, 2029, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_3_output_0", "outputIndexes": +[ 2030 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2030 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.17/self_attn/Neg_1_output_0", "outputIndexes": +[ 2031 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2028, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2032 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2014, 24, 2032, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.17/self_attn/Slice_2_output_0", "outputIndexes": +[ 2033 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2031, 2033 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.17/self_attn/Concat_4_output_0", "outputIndexes": +[ 2034 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2034, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Mul_3_output_0", "outputIndexes": +[ 2035 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2015, 2035 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/self_attn/Add_1_output_0", "outputIndexes": +[ 2036 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3445 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 286776934, 147478, 36864, 0, 0 ] + } +, "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": +[ 3454 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3454 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3455 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3455 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2037 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1972, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2038 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1980, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.17/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2039 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2038, 2039, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.17/self_attn/Concat_2_output_0", "outputIndexes": +[ 2040 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2037, 2040 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.17/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2041 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7693", "outputIndexes": +[ 2042 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7696", "outputIndexes": +[ 2043 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2042, 2043, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7699", "outputIndexes": +[ 2044 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2044 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7700", "outputIndexes": +[ 2045 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2045, 2045 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7702", "outputIndexes": +[ 2046 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2046, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_35_output_0", "outputIndexes": +[ 2047 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2007, 2036, 2041, 2047 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.17/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2048 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2048 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3456 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3456 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3457 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3457 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 286961276, 589846, 147456, 0, 0 ] + } +, "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": +[ 3458 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3458 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3459 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3459 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2049 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2049 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 287698578, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.17/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2051 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 1959, 2051 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/Add_output_0", "outputIndexes": +[ 2052 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2052 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 287707794, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.17/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2053 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2053 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3460 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3460 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3461 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3461 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 287717010, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": +[ 3462 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3462 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3463 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3463 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2054 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2054 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.17/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2055 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2054, 2055 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2056 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2056 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2057 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2054, 2057 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2058 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2058 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2059 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2059 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.17/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2060 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2060 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2061 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2054, 2061 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2062 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2062 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2063 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3461 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 292693672, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": +[ 3466 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3466 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3467 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3467 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2064 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2063, 2064 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/mlp/Mul_output_0", "outputIndexes": +[ 2065 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2065 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3468 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3468 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3469 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3469 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 297670334, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": +[ 3470 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3470 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3471 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3471 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2066 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2066 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 302646996, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.17/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2068 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2052, 2068 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.17/Add_1_output_0", "outputIndexes": +[ 2069 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2069, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/Reshape_output_0", "outputIndexes": +[ 2070 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2070 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 302656212, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.18/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2071 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2071 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3472 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3472 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3473 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3473 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 302665428, 589846, 147456, 0, 0 ] + } +, "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": +[ 3474 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3474 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3475 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3475 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2072 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2071 ] +, "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_output_0", "outputIndexes": +[ 2073 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2073 ] +, "main_type": "NONE", "name": "Shape7853", "outputIndexes": +[ 2074 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2073 ] +, "main_type": "NONE", "name": "Rank7855", "outputIndexes": +[ 2075 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2075, 2075 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7857", "outputIndexes": +[ 2076 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2076 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7858", "outputIndexes": +[ 2077 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2076, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7860", "outputIndexes": +[ 2078 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2078 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7861", "outputIndexes": +[ 2079 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2074, 2077, 2079, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7864", "outputIndexes": +[ 2080 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2080 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7865", "outputIndexes": +[ 2081 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2081, 2081 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7867", "outputIndexes": +[ 2082 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2073, 2082, 2076 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_output_0", "outputIndexes": +[ 2083 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2083, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2084 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2076 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7875", "outputIndexes": +[ 2085 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2078 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7878", "outputIndexes": +[ 2086 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2074, 2085, 2086, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7881", "outputIndexes": +[ 2087 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2087 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7882", "outputIndexes": +[ 2088 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2088 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7883", "outputIndexes": +[ 2089 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2089, 2088 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7884", "outputIndexes": +[ 2090 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2073, 2090, 2076 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_1_output_0", "outputIndexes": +[ 2091 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2091, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2092 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2084, 2092, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.18/self_attn/Concat_output_0", "outputIndexes": +[ 2093 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2072, 2093 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/self_attn/Reshape_output_0", "outputIndexes": +[ 2094 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2094 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 303402730, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.18/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2096 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2096, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_output_0", "outputIndexes": +[ 2097 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2096 ] +, "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_2_output_0", "outputIndexes": +[ 2098 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2098 ] +, "main_type": "NONE", "name": "Shape8002", "outputIndexes": +[ 2099 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2098 ] +, "main_type": "NONE", "name": "Rank8004", "outputIndexes": +[ 2100 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2100, 2100 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8006", "outputIndexes": +[ 2101 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2101 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8007", "outputIndexes": +[ 2102 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2101, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8009", "outputIndexes": +[ 2103 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2103 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8010", "outputIndexes": +[ 2104 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2099, 2102, 2104, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8013", "outputIndexes": +[ 2105 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2105 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8014", "outputIndexes": +[ 2106 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2106 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8015", "outputIndexes": +[ 2107 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2107, 2106 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8016", "outputIndexes": +[ 2108 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2098, 2108, 2101 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_2_output_0", "outputIndexes": +[ 2109 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2109, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Div_output_0", "outputIndexes": +[ 2110 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2110, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2111 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2096, 2111, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_1_output_0", "outputIndexes": +[ 2112 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2112 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.18/self_attn/Neg_output_0", "outputIndexes": +[ 2113 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2110, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2114 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2096, 24, 2114, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_output_0", "outputIndexes": +[ 2115 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2113, 2115 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.18/self_attn/Concat_3_output_0", "outputIndexes": +[ 2116 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2116, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_1_output_0", "outputIndexes": +[ 2117 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2097, 2117 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Add_output_0", "outputIndexes": +[ 2118 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3473 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 303404778, 147478, 36864, 0, 0 ] + } +, "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": +[ 3478 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3478 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3479 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3479 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2119 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2083, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2120 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2091, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2121 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2120, 2121, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.18/self_attn/Concat_1_output_0", "outputIndexes": +[ 2122 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2119, 2122 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2123 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2123 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 303589120, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.18/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2125 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2125, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_2_output_0", "outputIndexes": +[ 2126 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2125 ] +, "main_type": "NONE", "name": "/blocks.18/self_attn/Shape_3_output_0", "outputIndexes": +[ 2127 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2127 ] +, "main_type": "NONE", "name": "Shape7900", "outputIndexes": +[ 2128 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2127 ] +, "main_type": "NONE", "name": "Rank7902", "outputIndexes": +[ 2129 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2129, 2129 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7904", "outputIndexes": +[ 2130 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2130 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7905", "outputIndexes": +[ 2131 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2130, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7907", "outputIndexes": +[ 2132 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2132 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze7908", "outputIndexes": +[ 2133 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2128, 2131, 2133, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice7911", "outputIndexes": +[ 2134 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2134 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze7912", "outputIndexes": +[ 2135 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2135 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7913", "outputIndexes": +[ 2136 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2136, 2135 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp7914", "outputIndexes": +[ 2137 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2127, 2137, 2130 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.18/self_attn/Gather_3_output_0", "outputIndexes": +[ 2138 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2138, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Div_1_output_0", "outputIndexes": +[ 2139 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2139, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2140 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2125, 2140, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_3_output_0", "outputIndexes": +[ 2141 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2141 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.18/self_attn/Neg_1_output_0", "outputIndexes": +[ 2142 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2139, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2143 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2125, 24, 2143, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.18/self_attn/Slice_2_output_0", "outputIndexes": +[ 2144 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2142, 2144 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.18/self_attn/Concat_4_output_0", "outputIndexes": +[ 2145 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2145, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Mul_3_output_0", "outputIndexes": +[ 2146 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2126, 2146 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/self_attn/Add_1_output_0", "outputIndexes": +[ 2147 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3473 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 303591168, 147478, 36864, 0, 0 ] + } +, "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": +[ 3482 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3482 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3483 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3483 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2148 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2083, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2149 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2091, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.18/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2150 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2149, 2150, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.18/self_attn/Concat_2_output_0", "outputIndexes": +[ 2151 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2148, 2151 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.18/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2152 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8123", "outputIndexes": +[ 2153 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8126", "outputIndexes": +[ 2154 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2153, 2154, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8129", "outputIndexes": +[ 2155 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2155 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8130", "outputIndexes": +[ 2156 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2156 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8131", "outputIndexes": +[ 2157 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2157, 2156 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8132", "outputIndexes": +[ 2158 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2158, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_37_output_0", "outputIndexes": +[ 2159 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2118, 2147, 2152, 2159 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.18/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2160 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2160 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3484 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3484 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3485 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3485 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 303775510, 589846, 147456, 0, 0 ] + } +, "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": +[ 3486 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3486 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3487 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3487 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2161 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2161 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 304512812, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.18/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2163 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2070, 2163 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/Add_output_0", "outputIndexes": +[ 2164 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2164 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 304522028, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.18/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2165 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2165 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3488 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3488 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3489 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3489 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 304531244, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": +[ 3490 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3490 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3491 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3491 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2166 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2166 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.18/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2167 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2166, 2167 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2168 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2168 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2169 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2166, 2169 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2170 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2170 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2171 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2171 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.18/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2172 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2172 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2173 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2166, 2173 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2174 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2174 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2175 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3489 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 309507906, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": +[ 3494 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3494 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3495 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3495 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2176 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2175, 2176 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/mlp/Mul_output_0", "outputIndexes": +[ 2177 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2177 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3496 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3496 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3497 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3497 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 314484568, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": +[ 3498 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3498 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3499 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3499 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2178 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2178 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 319461230, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.18/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2180 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2164, 2180 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.18/Add_1_output_0", "outputIndexes": +[ 2181 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2181, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/Reshape_output_0", "outputIndexes": +[ 2182 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2182 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 319470446, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.19/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2183 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2183 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3500 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3500 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3501 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3501 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 319479662, 589846, 147456, 0, 0 ] + } +, "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": +[ 3502 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3502 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3503 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3503 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2184 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2183 ] +, "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_output_0", "outputIndexes": +[ 2185 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2185 ] +, "main_type": "NONE", "name": "Shape8283", "outputIndexes": +[ 2186 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2185 ] +, "main_type": "NONE", "name": "Rank8285", "outputIndexes": +[ 2187 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2187, 2187 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8287", "outputIndexes": +[ 2188 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2188 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8288", "outputIndexes": +[ 2189 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2188, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8290", "outputIndexes": +[ 2190 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2190 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8291", "outputIndexes": +[ 2191 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2186, 2189, 2191, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8294", "outputIndexes": +[ 2192 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2192 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8295", "outputIndexes": +[ 2193 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2193, 2193 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8297", "outputIndexes": +[ 2194 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2185, 2194, 2188 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_output_0", "outputIndexes": +[ 2195 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2195, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2196 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2188 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8305", "outputIndexes": +[ 2197 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2190 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8308", "outputIndexes": +[ 2198 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2186, 2197, 2198, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8311", "outputIndexes": +[ 2199 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2199 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8312", "outputIndexes": +[ 2200 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2200 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8313", "outputIndexes": +[ 2201 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2201, 2200 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8314", "outputIndexes": +[ 2202 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2185, 2202, 2188 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_1_output_0", "outputIndexes": +[ 2203 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2203, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2204 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2196, 2204, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.19/self_attn/Concat_output_0", "outputIndexes": +[ 2205 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2184, 2205 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/self_attn/Reshape_output_0", "outputIndexes": +[ 2206 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2206 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 320216964, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.19/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2208 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2208, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_output_0", "outputIndexes": +[ 2209 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2208 ] +, "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_2_output_0", "outputIndexes": +[ 2210 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2210 ] +, "main_type": "NONE", "name": "Shape8432", "outputIndexes": +[ 2211 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2210 ] +, "main_type": "NONE", "name": "Rank8434", "outputIndexes": +[ 2212 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2212, 2212 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8436", "outputIndexes": +[ 2213 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2213 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8437", "outputIndexes": +[ 2214 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2213, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8439", "outputIndexes": +[ 2215 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2215 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8440", "outputIndexes": +[ 2216 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2211, 2214, 2216, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8443", "outputIndexes": +[ 2217 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2217 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8444", "outputIndexes": +[ 2218 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2218 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8445", "outputIndexes": +[ 2219 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2219, 2218 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8446", "outputIndexes": +[ 2220 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2210, 2220, 2213 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_2_output_0", "outputIndexes": +[ 2221 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2221, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Div_output_0", "outputIndexes": +[ 2222 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2222, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2223 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2208, 2223, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_1_output_0", "outputIndexes": +[ 2224 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2224 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.19/self_attn/Neg_output_0", "outputIndexes": +[ 2225 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2222, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2226 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2208, 24, 2226, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_output_0", "outputIndexes": +[ 2227 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2225, 2227 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.19/self_attn/Concat_3_output_0", "outputIndexes": +[ 2228 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2228, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_1_output_0", "outputIndexes": +[ 2229 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2209, 2229 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Add_output_0", "outputIndexes": +[ 2230 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3501 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 320219012, 147478, 36864, 0, 0 ] + } +, "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": +[ 3506 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3506 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3507 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3507 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2231 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2195, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2232 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2203, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2233 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2232, 2233, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.19/self_attn/Concat_1_output_0", "outputIndexes": +[ 2234 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2231, 2234 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2235 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2235 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 320403354, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.19/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2237 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2237, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_2_output_0", "outputIndexes": +[ 2238 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2237 ] +, "main_type": "NONE", "name": "/blocks.19/self_attn/Shape_3_output_0", "outputIndexes": +[ 2239 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2239 ] +, "main_type": "NONE", "name": "Shape8330", "outputIndexes": +[ 2240 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2239 ] +, "main_type": "NONE", "name": "Rank8332", "outputIndexes": +[ 2241 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2241, 2241 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8334", "outputIndexes": +[ 2242 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2242 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8335", "outputIndexes": +[ 2243 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2242, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8337", "outputIndexes": +[ 2244 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2244 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8338", "outputIndexes": +[ 2245 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2240, 2243, 2245, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8341", "outputIndexes": +[ 2246 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2246 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8342", "outputIndexes": +[ 2247 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2247 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8343", "outputIndexes": +[ 2248 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2248, 2247 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8344", "outputIndexes": +[ 2249 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2239, 2249, 2242 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.19/self_attn/Gather_3_output_0", "outputIndexes": +[ 2250 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2250, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Div_1_output_0", "outputIndexes": +[ 2251 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2251, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2252 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2237, 2252, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_3_output_0", "outputIndexes": +[ 2253 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2253 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.19/self_attn/Neg_1_output_0", "outputIndexes": +[ 2254 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2251, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2255 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2237, 24, 2255, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.19/self_attn/Slice_2_output_0", "outputIndexes": +[ 2256 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2254, 2256 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.19/self_attn/Concat_4_output_0", "outputIndexes": +[ 2257 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2257, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Mul_3_output_0", "outputIndexes": +[ 2258 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2238, 2258 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/self_attn/Add_1_output_0", "outputIndexes": +[ 2259 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3501 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 320405402, 147478, 36864, 0, 0 ] + } +, "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": +[ 3510 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3510 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3511 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3511 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2260 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2195, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2261 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2203, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.19/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2262 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2261, 2262, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.19/self_attn/Concat_2_output_0", "outputIndexes": +[ 2263 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2260, 2263 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.19/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2264 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8553", "outputIndexes": +[ 2265 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8556", "outputIndexes": +[ 2266 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2265, 2266, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8559", "outputIndexes": +[ 2267 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2267 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8560", "outputIndexes": +[ 2268 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2268 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8561", "outputIndexes": +[ 2269 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2269, 2268 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8562", "outputIndexes": +[ 2270 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2270, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_39_output_0", "outputIndexes": +[ 2271 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2230, 2259, 2264, 2271 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.19/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2272 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2272 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3512 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3512 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3513 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3513 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 320589744, 589846, 147456, 0, 0 ] + } +, "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": +[ 3514 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3514 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3515 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3515 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2273 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2273 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 321327046, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.19/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2275 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2182, 2275 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/Add_output_0", "outputIndexes": +[ 2276 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2276 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 321336262, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.19/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2277 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2277 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3516 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3516 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3517 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3517 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 321345478, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": +[ 3518 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3518 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3519 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3519 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2278 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2278 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.19/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2279 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2278, 2279 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2280 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2280 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2281 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2278, 2281 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2282 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2282 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2283 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2283 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.19/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2284 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2284 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2285 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2278, 2285 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2286 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2286 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2287 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3517 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 326322140, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": +[ 3522 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3522 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3523 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3523 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2288 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2287, 2288 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/mlp/Mul_output_0", "outputIndexes": +[ 2289 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2289 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3524 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3524 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3525 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3525 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 331298802, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": +[ 3526 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3526 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3527 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3527 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2290 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2290 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 336275464, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.19/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2292 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2276, 2292 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.19/Add_1_output_0", "outputIndexes": +[ 2293 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2293, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/Reshape_output_0", "outputIndexes": +[ 2294 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2294 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 336284680, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.20/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2295 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2295 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3528 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3528 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3529 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3529 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 336293896, 589846, 147456, 0, 0 ] + } +, "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": +[ 3530 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3530 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3531 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3531 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2296 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2295 ] +, "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_output_0", "outputIndexes": +[ 2297 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2297 ] +, "main_type": "NONE", "name": "Shape8713", "outputIndexes": +[ 2298 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2297 ] +, "main_type": "NONE", "name": "Rank8715", "outputIndexes": +[ 2299 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2299, 2299 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8717", "outputIndexes": +[ 2300 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2300 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8718", "outputIndexes": +[ 2301 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2300, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8720", "outputIndexes": +[ 2302 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2302 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8721", "outputIndexes": +[ 2303 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2298, 2301, 2303, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8724", "outputIndexes": +[ 2304 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2304 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8725", "outputIndexes": +[ 2305 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2305, 2305 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8727", "outputIndexes": +[ 2306 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2297, 2306, 2300 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_output_0", "outputIndexes": +[ 2307 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2307, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2308 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2300 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8735", "outputIndexes": +[ 2309 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2302 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8738", "outputIndexes": +[ 2310 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2298, 2309, 2310, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8741", "outputIndexes": +[ 2311 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2311 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8742", "outputIndexes": +[ 2312 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2312 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8743", "outputIndexes": +[ 2313 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2313, 2312 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8744", "outputIndexes": +[ 2314 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2297, 2314, 2300 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_1_output_0", "outputIndexes": +[ 2315 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2315, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2316 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2308, 2316, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.20/self_attn/Concat_output_0", "outputIndexes": +[ 2317 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2296, 2317 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/self_attn/Reshape_output_0", "outputIndexes": +[ 2318 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2318 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 337031198, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.20/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2320 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2320, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_output_0", "outputIndexes": +[ 2321 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2320 ] +, "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_2_output_0", "outputIndexes": +[ 2322 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2322 ] +, "main_type": "NONE", "name": "Shape8862", "outputIndexes": +[ 2323 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2322 ] +, "main_type": "NONE", "name": "Rank8864", "outputIndexes": +[ 2324 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2324, 2324 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8866", "outputIndexes": +[ 2325 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2325 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8867", "outputIndexes": +[ 2326 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2325, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8869", "outputIndexes": +[ 2327 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2327 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8870", "outputIndexes": +[ 2328 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2323, 2326, 2328, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8873", "outputIndexes": +[ 2329 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2329 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8874", "outputIndexes": +[ 2330 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2330 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8875", "outputIndexes": +[ 2331 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2331, 2330 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8876", "outputIndexes": +[ 2332 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2322, 2332, 2325 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_2_output_0", "outputIndexes": +[ 2333 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2333, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Div_output_0", "outputIndexes": +[ 2334 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2334, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2335 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2320, 2335, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_1_output_0", "outputIndexes": +[ 2336 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2336 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.20/self_attn/Neg_output_0", "outputIndexes": +[ 2337 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2334, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2338 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2320, 24, 2338, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_output_0", "outputIndexes": +[ 2339 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2337, 2339 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.20/self_attn/Concat_3_output_0", "outputIndexes": +[ 2340 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2340, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_1_output_0", "outputIndexes": +[ 2341 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2321, 2341 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Add_output_0", "outputIndexes": +[ 2342 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3529 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 337033246, 147478, 36864, 0, 0 ] + } +, "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": +[ 3534 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3534 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3535 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3535 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2343 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2307, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2344 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2315, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2345 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2344, 2345, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.20/self_attn/Concat_1_output_0", "outputIndexes": +[ 2346 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2343, 2346 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2347 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2347 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 337217588, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.20/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2349 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2349, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_2_output_0", "outputIndexes": +[ 2350 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2349 ] +, "main_type": "NONE", "name": "/blocks.20/self_attn/Shape_3_output_0", "outputIndexes": +[ 2351 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2351 ] +, "main_type": "NONE", "name": "Shape8760", "outputIndexes": +[ 2352 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2351 ] +, "main_type": "NONE", "name": "Rank8762", "outputIndexes": +[ 2353 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2353, 2353 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8764", "outputIndexes": +[ 2354 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2354 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8765", "outputIndexes": +[ 2355 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2354, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8767", "outputIndexes": +[ 2356 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2356 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8768", "outputIndexes": +[ 2357 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2352, 2355, 2357, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8771", "outputIndexes": +[ 2358 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2358 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8772", "outputIndexes": +[ 2359 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2359 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8773", "outputIndexes": +[ 2360 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2360, 2359 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8774", "outputIndexes": +[ 2361 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2351, 2361, 2354 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.20/self_attn/Gather_3_output_0", "outputIndexes": +[ 2362 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2362, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Div_1_output_0", "outputIndexes": +[ 2363 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2363, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2364 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2349, 2364, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_3_output_0", "outputIndexes": +[ 2365 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2365 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.20/self_attn/Neg_1_output_0", "outputIndexes": +[ 2366 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2363, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2367 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2349, 24, 2367, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.20/self_attn/Slice_2_output_0", "outputIndexes": +[ 2368 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2366, 2368 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.20/self_attn/Concat_4_output_0", "outputIndexes": +[ 2369 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2369, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Mul_3_output_0", "outputIndexes": +[ 2370 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2350, 2370 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/self_attn/Add_1_output_0", "outputIndexes": +[ 2371 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3529 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 337219636, 147478, 36864, 0, 0 ] + } +, "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": +[ 3538 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3538 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3539 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3539 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2372 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2307, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2373 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2315, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.20/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2374 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2373, 2374, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.20/self_attn/Concat_2_output_0", "outputIndexes": +[ 2375 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2372, 2375 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.20/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2376 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8983", "outputIndexes": +[ 2377 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze8986", "outputIndexes": +[ 2378 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2377, 2378, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice8989", "outputIndexes": +[ 2379 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2379 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze8990", "outputIndexes": +[ 2380 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2380 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8991", "outputIndexes": +[ 2381 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2381, 2380 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp8992", "outputIndexes": +[ 2382 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2382, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_41_output_0", "outputIndexes": +[ 2383 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2342, 2371, 2376, 2383 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.20/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2384 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2384 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3540 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3540 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3541 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3541 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 337403978, 589846, 147456, 0, 0 ] + } +, "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": +[ 3542 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3542 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3543 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3543 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2385 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2385 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 338141280, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.20/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2387 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2294, 2387 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/Add_output_0", "outputIndexes": +[ 2388 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2388 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 338150496, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.20/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2389 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2389 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3544 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3544 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3545 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3545 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 338159712, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": +[ 3546 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3546 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3547 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3547 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2390 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2390 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.20/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2391 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2390, 2391 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2392 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2392 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2393 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2390, 2393 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2394 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2394 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2395 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2395 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.20/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2396 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2396 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2397 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2390, 2397 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2398 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2398 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2399 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3545 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 343136374, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": +[ 3550 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3550 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3551 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3551 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2400 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2399, 2400 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/mlp/Mul_output_0", "outputIndexes": +[ 2401 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2401 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3552 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3552 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3553 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3553 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 348113036, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": +[ 3554 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3554 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3555 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3555 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2402 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2402 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 353089698, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.20/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2404 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2388, 2404 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.20/Add_1_output_0", "outputIndexes": +[ 2405 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2405, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/Reshape_output_0", "outputIndexes": +[ 2406 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2406 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 353098914, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.21/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2407 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2407 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3556 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3556 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3557 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3557 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 353108130, 589846, 147456, 0, 0 ] + } +, "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": +[ 3558 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3558 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3559 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3559 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2408 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2407 ] +, "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_output_0", "outputIndexes": +[ 2409 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2409 ] +, "main_type": "NONE", "name": "Shape9143", "outputIndexes": +[ 2410 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2409 ] +, "main_type": "NONE", "name": "Rank9145", "outputIndexes": +[ 2411 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2411, 2411 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9147", "outputIndexes": +[ 2412 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2412 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9148", "outputIndexes": +[ 2413 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2412, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9150", "outputIndexes": +[ 2414 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2414 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9151", "outputIndexes": +[ 2415 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2410, 2413, 2415, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9154", "outputIndexes": +[ 2416 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2416 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9155", "outputIndexes": +[ 2417 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2417, 2417 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9157", "outputIndexes": +[ 2418 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2409, 2418, 2412 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_output_0", "outputIndexes": +[ 2419 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2419, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2420 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2412 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9165", "outputIndexes": +[ 2421 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2414 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9168", "outputIndexes": +[ 2422 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2410, 2421, 2422, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9171", "outputIndexes": +[ 2423 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2423 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9172", "outputIndexes": +[ 2424 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2424 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9173", "outputIndexes": +[ 2425 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2425, 2424 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9174", "outputIndexes": +[ 2426 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2409, 2426, 2412 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_1_output_0", "outputIndexes": +[ 2427 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2427, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2428 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2420, 2428, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.21/self_attn/Concat_output_0", "outputIndexes": +[ 2429 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2408, 2429 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/self_attn/Reshape_output_0", "outputIndexes": +[ 2430 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2430 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 353845432, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.21/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2432 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2432, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_output_0", "outputIndexes": +[ 2433 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2432 ] +, "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_2_output_0", "outputIndexes": +[ 2434 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2434 ] +, "main_type": "NONE", "name": "Shape9292", "outputIndexes": +[ 2435 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2434 ] +, "main_type": "NONE", "name": "Rank9294", "outputIndexes": +[ 2436 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2436, 2436 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9296", "outputIndexes": +[ 2437 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2437 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9297", "outputIndexes": +[ 2438 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2437, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9299", "outputIndexes": +[ 2439 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2439 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9300", "outputIndexes": +[ 2440 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2435, 2438, 2440, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9303", "outputIndexes": +[ 2441 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2441 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9304", "outputIndexes": +[ 2442 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2442 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9305", "outputIndexes": +[ 2443 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2443, 2442 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9306", "outputIndexes": +[ 2444 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2434, 2444, 2437 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_2_output_0", "outputIndexes": +[ 2445 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2445, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Div_output_0", "outputIndexes": +[ 2446 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2446, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2447 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2432, 2447, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_1_output_0", "outputIndexes": +[ 2448 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2448 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.21/self_attn/Neg_output_0", "outputIndexes": +[ 2449 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2446, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2450 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2432, 24, 2450, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_output_0", "outputIndexes": +[ 2451 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2449, 2451 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.21/self_attn/Concat_3_output_0", "outputIndexes": +[ 2452 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2452, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_1_output_0", "outputIndexes": +[ 2453 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2433, 2453 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Add_output_0", "outputIndexes": +[ 2454 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3557 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 353847480, 147478, 36864, 0, 0 ] + } +, "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": +[ 3562 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3562 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3563 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3563 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2455 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2419, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2456 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2427, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2457 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2456, 2457, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.21/self_attn/Concat_1_output_0", "outputIndexes": +[ 2458 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2455, 2458 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2459 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2459 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 354031822, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.21/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2461 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2461, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_2_output_0", "outputIndexes": +[ 2462 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2461 ] +, "main_type": "NONE", "name": "/blocks.21/self_attn/Shape_3_output_0", "outputIndexes": +[ 2463 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2463 ] +, "main_type": "NONE", "name": "Shape9190", "outputIndexes": +[ 2464 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2463 ] +, "main_type": "NONE", "name": "Rank9192", "outputIndexes": +[ 2465 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2465, 2465 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9194", "outputIndexes": +[ 2466 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2466 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9195", "outputIndexes": +[ 2467 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2466, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9197", "outputIndexes": +[ 2468 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2468 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9198", "outputIndexes": +[ 2469 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2464, 2467, 2469, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9201", "outputIndexes": +[ 2470 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2470 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9202", "outputIndexes": +[ 2471 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2471 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9203", "outputIndexes": +[ 2472 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2472, 2471 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9204", "outputIndexes": +[ 2473 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2463, 2473, 2466 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.21/self_attn/Gather_3_output_0", "outputIndexes": +[ 2474 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2474, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Div_1_output_0", "outputIndexes": +[ 2475 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2475, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2476 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2461, 2476, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_3_output_0", "outputIndexes": +[ 2477 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2477 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.21/self_attn/Neg_1_output_0", "outputIndexes": +[ 2478 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2475, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2479 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2461, 24, 2479, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.21/self_attn/Slice_2_output_0", "outputIndexes": +[ 2480 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2478, 2480 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.21/self_attn/Concat_4_output_0", "outputIndexes": +[ 2481 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2481, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Mul_3_output_0", "outputIndexes": +[ 2482 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2462, 2482 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/self_attn/Add_1_output_0", "outputIndexes": +[ 2483 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3557 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 354033870, 147478, 36864, 0, 0 ] + } +, "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": +[ 3566 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3566 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3567 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3567 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2484 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2419, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2485 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2427, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.21/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2486 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2485, 2486, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.21/self_attn/Concat_2_output_0", "outputIndexes": +[ 2487 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2484, 2487 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.21/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2488 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9413", "outputIndexes": +[ 2489 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9416", "outputIndexes": +[ 2490 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2489, 2490, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9419", "outputIndexes": +[ 2491 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2491 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9420", "outputIndexes": +[ 2492 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2492 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9421", "outputIndexes": +[ 2493 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2493, 2492 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9422", "outputIndexes": +[ 2494 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2494, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_43_output_0", "outputIndexes": +[ 2495 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2454, 2483, 2488, 2495 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.21/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2496 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2496 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3568 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3568 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3569 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3569 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 354218212, 589846, 147456, 0, 0 ] + } +, "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": +[ 3570 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3570 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3571 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3571 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2497 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2497 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 354955514, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.21/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2499 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2406, 2499 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/Add_output_0", "outputIndexes": +[ 2500 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2500 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 354964730, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.21/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2501 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2501 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3572 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3572 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3573 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3573 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 354973946, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": +[ 3574 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3574 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3575 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3575 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2502 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2502 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.21/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2503 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2502, 2503 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2504 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2504 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2505 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2502, 2505 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2506 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2506 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2507 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2507 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.21/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2508 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2508 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2509 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2502, 2509 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2510 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2510 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2511 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3573 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 359950608, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": +[ 3578 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3578 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3579 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3579 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2512 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2511, 2512 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/mlp/Mul_output_0", "outputIndexes": +[ 2513 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2513 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3580 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3580 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3581 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3581 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 364927270, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": +[ 3582 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3582 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3583 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3583 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2514 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2514 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 369903932, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.21/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2516 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2500, 2516 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.21/Add_1_output_0", "outputIndexes": +[ 2517 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2517, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/Reshape_output_0", "outputIndexes": +[ 2518 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2518 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 369913148, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.22/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2519 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2519 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3584 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3584 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3585 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3585 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 369922364, 589846, 147456, 0, 0 ] + } +, "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": +[ 3586 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3586 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3587 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3587 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2520 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2519 ] +, "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_output_0", "outputIndexes": +[ 2521 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2521 ] +, "main_type": "NONE", "name": "Shape9573", "outputIndexes": +[ 2522 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2521 ] +, "main_type": "NONE", "name": "Rank9575", "outputIndexes": +[ 2523 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2523, 2523 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9577", "outputIndexes": +[ 2524 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2524 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9578", "outputIndexes": +[ 2525 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2524, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9580", "outputIndexes": +[ 2526 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2526 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9581", "outputIndexes": +[ 2527 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2522, 2525, 2527, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9584", "outputIndexes": +[ 2528 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2528 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9585", "outputIndexes": +[ 2529 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2529, 2529 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9587", "outputIndexes": +[ 2530 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2521, 2530, 2524 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_output_0", "outputIndexes": +[ 2531 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2531, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2532 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2524 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9595", "outputIndexes": +[ 2533 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2526 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9598", "outputIndexes": +[ 2534 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2522, 2533, 2534, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9601", "outputIndexes": +[ 2535 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2535 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9602", "outputIndexes": +[ 2536 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2536 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9603", "outputIndexes": +[ 2537 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2537, 2536 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9604", "outputIndexes": +[ 2538 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2521, 2538, 2524 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_1_output_0", "outputIndexes": +[ 2539 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2539, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2540 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2532, 2540, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.22/self_attn/Concat_output_0", "outputIndexes": +[ 2541 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2520, 2541 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/self_attn/Reshape_output_0", "outputIndexes": +[ 2542 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2542 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 370659666, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.22/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2544 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_output_0", "outputIndexes": +[ 2545 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544 ] +, "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_2_output_0", "outputIndexes": +[ 2546 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2546 ] +, "main_type": "NONE", "name": "Shape9722", "outputIndexes": +[ 2547 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2546 ] +, "main_type": "NONE", "name": "Rank9724", "outputIndexes": +[ 2548 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2548, 2548 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9726", "outputIndexes": +[ 2549 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2549 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9727", "outputIndexes": +[ 2550 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2549, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9729", "outputIndexes": +[ 2551 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2551 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9730", "outputIndexes": +[ 2552 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2547, 2550, 2552, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9733", "outputIndexes": +[ 2553 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2553 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9734", "outputIndexes": +[ 2554 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2554 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9735", "outputIndexes": +[ 2555 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2555, 2554 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9736", "outputIndexes": +[ 2556 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2546, 2556, 2549 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_2_output_0", "outputIndexes": +[ 2557 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2557, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Div_output_0", "outputIndexes": +[ 2558 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2558, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2559 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544, 2559, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_1_output_0", "outputIndexes": +[ 2560 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2560 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.22/self_attn/Neg_output_0", "outputIndexes": +[ 2561 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2558, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2562 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2544, 24, 2562, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_output_0", "outputIndexes": +[ 2563 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2561, 2563 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.22/self_attn/Concat_3_output_0", "outputIndexes": +[ 2564 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2564, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_1_output_0", "outputIndexes": +[ 2565 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2545, 2565 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Add_output_0", "outputIndexes": +[ 2566 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3585 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 370661714, 147478, 36864, 0, 0 ] + } +, "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": +[ 3590 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3590 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3591 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3591 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2567 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2531, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2568 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2539, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2569 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2568, 2569, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.22/self_attn/Concat_1_output_0", "outputIndexes": +[ 2570 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2567, 2570 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2571 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2571 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 370846056, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.22/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2573 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2573, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_2_output_0", "outputIndexes": +[ 2574 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2573 ] +, "main_type": "NONE", "name": "/blocks.22/self_attn/Shape_3_output_0", "outputIndexes": +[ 2575 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2575 ] +, "main_type": "NONE", "name": "Shape9620", "outputIndexes": +[ 2576 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2575 ] +, "main_type": "NONE", "name": "Rank9622", "outputIndexes": +[ 2577 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2577, 2577 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9624", "outputIndexes": +[ 2578 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2578 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9625", "outputIndexes": +[ 2579 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2578, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9627", "outputIndexes": +[ 2580 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2580 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9628", "outputIndexes": +[ 2581 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2576, 2579, 2581, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9631", "outputIndexes": +[ 2582 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2582 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9632", "outputIndexes": +[ 2583 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2583 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9633", "outputIndexes": +[ 2584 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2584, 2583 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9634", "outputIndexes": +[ 2585 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2575, 2585, 2578 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.22/self_attn/Gather_3_output_0", "outputIndexes": +[ 2586 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2586, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Div_1_output_0", "outputIndexes": +[ 2587 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2587, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2588 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2573, 2588, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_3_output_0", "outputIndexes": +[ 2589 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2589 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.22/self_attn/Neg_1_output_0", "outputIndexes": +[ 2590 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2587, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2591 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2573, 24, 2591, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.22/self_attn/Slice_2_output_0", "outputIndexes": +[ 2592 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2590, 2592 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.22/self_attn/Concat_4_output_0", "outputIndexes": +[ 2593 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2593, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Mul_3_output_0", "outputIndexes": +[ 2594 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2574, 2594 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/self_attn/Add_1_output_0", "outputIndexes": +[ 2595 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3585 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 370848104, 147478, 36864, 0, 0 ] + } +, "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": +[ 3594 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3594 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3595 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3595 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2596 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2531, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2597 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2539, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.22/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2598 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2597, 2598, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.22/self_attn/Concat_2_output_0", "outputIndexes": +[ 2599 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2596, 2599 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.22/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2600 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9843", "outputIndexes": +[ 2601 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze9846", "outputIndexes": +[ 2602 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2601, 2602, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice9849", "outputIndexes": +[ 2603 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2603 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze9850", "outputIndexes": +[ 2604 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2604 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9851", "outputIndexes": +[ 2605 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2605, 2604 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp9852", "outputIndexes": +[ 2606 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2606, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_45_output_0", "outputIndexes": +[ 2607 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2566, 2595, 2600, 2607 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.22/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2608 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2608 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3596 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3596 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3597 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3597 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 371032446, 589846, 147456, 0, 0 ] + } +, "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": +[ 3598 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3598 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3599 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3599 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2609 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2609 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 371769748, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.22/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2611 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2518, 2611 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/Add_output_0", "outputIndexes": +[ 2612 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2612 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 371778964, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.22/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2613 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2613 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3600 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3600 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3601 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3601 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 371788180, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": +[ 3602 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3602 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3603 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3603 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2614 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2614 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.22/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2615 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2614, 2615 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2616 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2616 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2617 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2614, 2617 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2618 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2618 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2619 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2619 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.22/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2620 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2620 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2621 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2614, 2621 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2622 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2622 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2623 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3601 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 376764842, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": +[ 3606 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3606 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3607 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3607 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2624 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2623, 2624 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/mlp/Mul_output_0", "outputIndexes": +[ 2625 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2625 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3608 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3608 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3609 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3609 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 381741504, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": +[ 3610 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3610 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3611 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3611 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2626 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2626 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 386718166, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.22/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2628 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2612, 2628 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.22/Add_1_output_0", "outputIndexes": +[ 2629 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2629, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/Reshape_output_0", "outputIndexes": +[ 2630 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2630 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 386727382, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.23/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2631 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2631 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3612 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3612 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3613 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3613 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 386736598, 589846, 147456, 0, 0 ] + } +, "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": +[ 3614 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3614 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3615 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3615 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2632 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2631 ] +, "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_output_0", "outputIndexes": +[ 2633 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2633 ] +, "main_type": "NONE", "name": "Shape10003", "outputIndexes": +[ 2634 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2633 ] +, "main_type": "NONE", "name": "Rank10005", "outputIndexes": +[ 2635 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2635, 2635 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10007", "outputIndexes": +[ 2636 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2636 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10008", "outputIndexes": +[ 2637 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2636, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10010", "outputIndexes": +[ 2638 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2638 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10011", "outputIndexes": +[ 2639 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2634, 2637, 2639, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10014", "outputIndexes": +[ 2640 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2640 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10015", "outputIndexes": +[ 2641 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2641, 2641 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10017", "outputIndexes": +[ 2642 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2633, 2642, 2636 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_output_0", "outputIndexes": +[ 2643 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2643, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2644 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2636 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10025", "outputIndexes": +[ 2645 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2638 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10028", "outputIndexes": +[ 2646 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2634, 2645, 2646, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10031", "outputIndexes": +[ 2647 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2647 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10032", "outputIndexes": +[ 2648 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2648 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10033", "outputIndexes": +[ 2649 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2649, 2648 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10034", "outputIndexes": +[ 2650 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2633, 2650, 2636 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_1_output_0", "outputIndexes": +[ 2651 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2652 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2644, 2652, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.23/self_attn/Concat_output_0", "outputIndexes": +[ 2653 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2632, 2653 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/self_attn/Reshape_output_0", "outputIndexes": +[ 2654 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2654 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 387473900, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.23/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2656 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2656, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_output_0", "outputIndexes": +[ 2657 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2656 ] +, "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_2_output_0", "outputIndexes": +[ 2658 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2658 ] +, "main_type": "NONE", "name": "Shape10152", "outputIndexes": +[ 2659 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2658 ] +, "main_type": "NONE", "name": "Rank10154", "outputIndexes": +[ 2660 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2660, 2660 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10156", "outputIndexes": +[ 2661 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2661 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10157", "outputIndexes": +[ 2662 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2661, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10159", "outputIndexes": +[ 2663 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2663 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10160", "outputIndexes": +[ 2664 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2659, 2662, 2664, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10163", "outputIndexes": +[ 2665 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2665 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10164", "outputIndexes": +[ 2666 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2666 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10165", "outputIndexes": +[ 2667 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2667, 2666 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10166", "outputIndexes": +[ 2668 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2658, 2668, 2661 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_2_output_0", "outputIndexes": +[ 2669 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2669, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Div_output_0", "outputIndexes": +[ 2670 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2670, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2671 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2656, 2671, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_1_output_0", "outputIndexes": +[ 2672 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2672 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.23/self_attn/Neg_output_0", "outputIndexes": +[ 2673 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2670, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2674 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2656, 24, 2674, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_output_0", "outputIndexes": +[ 2675 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2673, 2675 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.23/self_attn/Concat_3_output_0", "outputIndexes": +[ 2676 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2676, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_1_output_0", "outputIndexes": +[ 2677 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2657, 2677 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Add_output_0", "outputIndexes": +[ 2678 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3613 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 387475948, 147478, 36864, 0, 0 ] + } +, "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": +[ 3618 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3618 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3619 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3619 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2679 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2643, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2680 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2681 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2680, 2681, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.23/self_attn/Concat_1_output_0", "outputIndexes": +[ 2682 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2679, 2682 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2683 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2683 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 387660290, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.23/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2685 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2685, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_2_output_0", "outputIndexes": +[ 2686 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2685 ] +, "main_type": "NONE", "name": "/blocks.23/self_attn/Shape_3_output_0", "outputIndexes": +[ 2687 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2687 ] +, "main_type": "NONE", "name": "Shape10050", "outputIndexes": +[ 2688 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2687 ] +, "main_type": "NONE", "name": "Rank10052", "outputIndexes": +[ 2689 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2689, 2689 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10054", "outputIndexes": +[ 2690 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2690 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10055", "outputIndexes": +[ 2691 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2690, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10057", "outputIndexes": +[ 2692 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2692 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10058", "outputIndexes": +[ 2693 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2688, 2691, 2693, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10061", "outputIndexes": +[ 2694 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2694 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10062", "outputIndexes": +[ 2695 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2695 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10063", "outputIndexes": +[ 2696 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2696, 2695 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10064", "outputIndexes": +[ 2697 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2687, 2697, 2690 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.23/self_attn/Gather_3_output_0", "outputIndexes": +[ 2698 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2698, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Div_1_output_0", "outputIndexes": +[ 2699 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2699, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2700 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2685, 2700, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_3_output_0", "outputIndexes": +[ 2701 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2701 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.23/self_attn/Neg_1_output_0", "outputIndexes": +[ 2702 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2699, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2703 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2685, 24, 2703, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.23/self_attn/Slice_2_output_0", "outputIndexes": +[ 2704 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2702, 2704 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.23/self_attn/Concat_4_output_0", "outputIndexes": +[ 2705 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2705, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Mul_3_output_0", "outputIndexes": +[ 2706 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2686, 2706 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/self_attn/Add_1_output_0", "outputIndexes": +[ 2707 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3613 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 387662338, 147478, 36864, 0, 0 ] + } +, "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": +[ 3622 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3622 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3623 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3623 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2708 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2643, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2709 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2651, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.23/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2710 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2709, 2710, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.23/self_attn/Concat_2_output_0", "outputIndexes": +[ 2711 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2708, 2711 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.23/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2712 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10273", "outputIndexes": +[ 2713 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10276", "outputIndexes": +[ 2714 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2713, 2714, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10279", "outputIndexes": +[ 2715 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2715 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10280", "outputIndexes": +[ 2716 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2716, 2716 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10282", "outputIndexes": +[ 2717 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2717, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_47_output_0", "outputIndexes": +[ 2718 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2678, 2707, 2712, 2718 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.23/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2719 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2719 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3624 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3624 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3625 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3625 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 387846680, 589846, 147456, 0, 0 ] + } +, "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": +[ 3626 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3626 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3627 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3627 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2720 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2720 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 388583982, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.23/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2722 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2630, 2722 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/Add_output_0", "outputIndexes": +[ 2723 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2723 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 388593198, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.23/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2724 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2724 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3628 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3628 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3629 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3629 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 388602414, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": +[ 3630 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3630 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3631 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3631 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2725 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2725 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.23/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2726 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2725, 2726 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2727 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2727 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2728 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2725, 2728 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2729 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2729 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2730 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2730 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.23/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2731 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2731 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2732 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2725, 2732 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2733 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2733 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2734 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3629 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 393579076, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": +[ 3634 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3634 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3635 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3635 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2735 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2734, 2735 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/mlp/Mul_output_0", "outputIndexes": +[ 2736 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2736 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3636 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3636 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3637 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3637 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 398555738, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": +[ 3638 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3638 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3639 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3639 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2737 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2737 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 403532400, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.23/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2739 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2723, 2739 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.23/Add_1_output_0", "outputIndexes": +[ 2740 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2740, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/Reshape_output_0", "outputIndexes": +[ 2741 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2741 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 403541616, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.24/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2742 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2742 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3640 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3640 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3641 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3641 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 403550832, 589846, 147456, 0, 0 ] + } +, "name": "/layers.24/self_attn/q_proj/Linear", "outputIndexes": +[ 3642 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3642 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3643 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3643 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2743 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2742 ] +, "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_output_0", "outputIndexes": +[ 2744 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2744 ] +, "main_type": "NONE", "name": "Shape10433", "outputIndexes": +[ 2745 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2744 ] +, "main_type": "NONE", "name": "Rank10435", "outputIndexes": +[ 2746 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2746, 2746 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10437", "outputIndexes": +[ 2747 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2747 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10438", "outputIndexes": +[ 2748 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2747, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10440", "outputIndexes": +[ 2749 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2749 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10441", "outputIndexes": +[ 2750 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2745, 2748, 2750, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10444", "outputIndexes": +[ 2751 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2751 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10445", "outputIndexes": +[ 2752 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2752, 2752 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10447", "outputIndexes": +[ 2753 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2744, 2753, 2747 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_output_0", "outputIndexes": +[ 2754 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2754, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2755 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2747 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10455", "outputIndexes": +[ 2756 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2749 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10458", "outputIndexes": +[ 2757 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2745, 2756, 2757, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10461", "outputIndexes": +[ 2758 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2758 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10462", "outputIndexes": +[ 2759 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2759 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10463", "outputIndexes": +[ 2760 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2760, 2759 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10464", "outputIndexes": +[ 2761 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2744, 2761, 2747 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_1_output_0", "outputIndexes": +[ 2762 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2762, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2763 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2755, 2763, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.24/self_attn/Concat_output_0", "outputIndexes": +[ 2764 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2743, 2764 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/self_attn/Reshape_output_0", "outputIndexes": +[ 2765 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2765 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 404288134, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.24/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2767 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_output_0", "outputIndexes": +[ 2768 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767 ] +, "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_2_output_0", "outputIndexes": +[ 2769 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2769 ] +, "main_type": "NONE", "name": "Shape10582", "outputIndexes": +[ 2770 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2769 ] +, "main_type": "NONE", "name": "Rank10584", "outputIndexes": +[ 2771 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2771, 2771 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10586", "outputIndexes": +[ 2772 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2772 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10587", "outputIndexes": +[ 2773 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2772, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10589", "outputIndexes": +[ 2774 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2774 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10590", "outputIndexes": +[ 2775 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2770, 2773, 2775, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10593", "outputIndexes": +[ 2776 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2776 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10594", "outputIndexes": +[ 2777 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2777 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10595", "outputIndexes": +[ 2778 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2778, 2777 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10596", "outputIndexes": +[ 2779 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2769, 2779, 2772 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_2_output_0", "outputIndexes": +[ 2780 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2780, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Div_output_0", "outputIndexes": +[ 2781 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2781, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2782 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767, 2782, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_1_output_0", "outputIndexes": +[ 2783 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2783 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.24/self_attn/Neg_output_0", "outputIndexes": +[ 2784 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2781, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2785 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2767, 24, 2785, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_output_0", "outputIndexes": +[ 2786 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2784, 2786 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.24/self_attn/Concat_3_output_0", "outputIndexes": +[ 2787 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2787, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_1_output_0", "outputIndexes": +[ 2788 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2768, 2788 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Add_output_0", "outputIndexes": +[ 2789 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3641 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 404290182, 147478, 36864, 0, 0 ] + } +, "name": "/layers.24/self_attn/k_proj/Linear", "outputIndexes": +[ 3646 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3646 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3647 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3647 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2790 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2754, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2791 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2762, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2792 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2791, 2792, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.24/self_attn/Concat_1_output_0", "outputIndexes": +[ 2793 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2790, 2793 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2794 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2794 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 404474524, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.24/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2796 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2796, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_2_output_0", "outputIndexes": +[ 2797 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2796 ] +, "main_type": "NONE", "name": "/blocks.24/self_attn/Shape_3_output_0", "outputIndexes": +[ 2798 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2798 ] +, "main_type": "NONE", "name": "Shape10480", "outputIndexes": +[ 2799 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2798 ] +, "main_type": "NONE", "name": "Rank10482", "outputIndexes": +[ 2800 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2800, 2800 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10484", "outputIndexes": +[ 2801 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2801 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10485", "outputIndexes": +[ 2802 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2801, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10487", "outputIndexes": +[ 2803 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2803 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10488", "outputIndexes": +[ 2804 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2799, 2802, 2804, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10491", "outputIndexes": +[ 2805 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2805 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10492", "outputIndexes": +[ 2806 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2806 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10493", "outputIndexes": +[ 2807 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2807, 2806 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10494", "outputIndexes": +[ 2808 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2798, 2808, 2801 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.24/self_attn/Gather_3_output_0", "outputIndexes": +[ 2809 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2809, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Div_1_output_0", "outputIndexes": +[ 2810 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2810, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2811 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2796, 2811, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_3_output_0", "outputIndexes": +[ 2812 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2812 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.24/self_attn/Neg_1_output_0", "outputIndexes": +[ 2813 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2810, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2814 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2796, 24, 2814, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.24/self_attn/Slice_2_output_0", "outputIndexes": +[ 2815 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2813, 2815 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.24/self_attn/Concat_4_output_0", "outputIndexes": +[ 2816 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2816, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Mul_3_output_0", "outputIndexes": +[ 2817 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2797, 2817 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/self_attn/Add_1_output_0", "outputIndexes": +[ 2818 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3641 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 404476572, 147478, 36864, 0, 0 ] + } +, "name": "/layers.24/self_attn/v_proj/Linear", "outputIndexes": +[ 3650 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3650 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3651 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3651 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2819 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2754, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2820 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2762, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.24/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2821 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2820, 2821, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.24/self_attn/Concat_2_output_0", "outputIndexes": +[ 2822 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2819, 2822 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.24/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2823 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10703", "outputIndexes": +[ 2824 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10706", "outputIndexes": +[ 2825 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2824, 2825, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10709", "outputIndexes": +[ 2826 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2826 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10710", "outputIndexes": +[ 2827 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2827 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10711", "outputIndexes": +[ 2828 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2828, 2827 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10712", "outputIndexes": +[ 2829 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2829, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_49_output_0", "outputIndexes": +[ 2830 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2789, 2818, 2823, 2830 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.24/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2831 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2831 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3652 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3652 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3653 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3653 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 404660914, 589846, 147456, 0, 0 ] + } +, "name": "/layers.24/self_attn/o_proj/Linear", "outputIndexes": +[ 3654 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3654 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3655 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3655 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2832 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2832 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 405398216, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.24/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2834 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2741, 2834 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/Add_output_0", "outputIndexes": +[ 2835 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2835 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 405407432, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.24/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2836 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2836 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3656 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3656 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3657 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3657 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 405416648, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.24/mlp/gate_proj/Linear", "outputIndexes": +[ 3658 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3658 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3659 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3659 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2837 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2837 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.24/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2838 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2837, 2838 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2839 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2839 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2840 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2837, 2840 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2841 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2841 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2842 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2842 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.24/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2843 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2843 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2844 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2837, 2844 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2845 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2845 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2846 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3657 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 410393310, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.24/mlp/up_proj/Linear", "outputIndexes": +[ 3662 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3662 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3663 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3663 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2847 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2846, 2847 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/mlp/Mul_output_0", "outputIndexes": +[ 2848 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2848 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3664 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3664 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3665 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3665 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 415369972, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.24/mlp/down_proj/Linear", "outputIndexes": +[ 3666 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3666 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.24/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3667 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3667 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2849 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2849 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 420346634, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.24/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2851 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2835, 2851 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.24/Add_1_output_0", "outputIndexes": +[ 2852 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2852, 7 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/Reshape_output_0", "outputIndexes": +[ 2853 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2853 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 420355850, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.25/input_layernorm/Mul_1_output_0", "outputIndexes": +[ 2854 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2854 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": +[ 3668 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3668 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "outputIndexes": +[ 3669 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3669 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1024, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 420365066, 589846, 147456, 0, 0 ] + } +, "name": "/layers.25/self_attn/q_proj/Linear", "outputIndexes": +[ 3670 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3670 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "outputIndexes": +[ 3671 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3671 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1024 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "outputIndexes": +[ 2855 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2854 ] +, "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_output_0", "outputIndexes": +[ 2856 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2856 ] +, "main_type": "NONE", "name": "Shape10863", "outputIndexes": +[ 2857 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2856 ] +, "main_type": "NONE", "name": "Rank10865", "outputIndexes": +[ 2858 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2858, 2858 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10867", "outputIndexes": +[ 2859 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2859 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10868", "outputIndexes": +[ 2860 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2859, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10870", "outputIndexes": +[ 2861 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2861 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10871", "outputIndexes": +[ 2862 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2857, 2860, 2862, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10874", "outputIndexes": +[ 2863 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2863 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10875", "outputIndexes": +[ 2864 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2864, 2864 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10877", "outputIndexes": +[ 2865 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2856, 2865, 2859 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_output_0", "outputIndexes": +[ 2866 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2866, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_output_0", "outputIndexes": +[ 2867 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2859 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10885", "outputIndexes": +[ 2868 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2861 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10888", "outputIndexes": +[ 2869 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2857, 2868, 2869, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10891", "outputIndexes": +[ 2870 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2870 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10892", "outputIndexes": +[ 2871 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2871 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10893", "outputIndexes": +[ 2872 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2872, 2871 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10894", "outputIndexes": +[ 2873 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2856, 2873, 2859 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_1_output_0", "outputIndexes": +[ 2874 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2874, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_1_output_0", "outputIndexes": +[ 2875 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2867, 2875, 34, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.25/self_attn/Concat_output_0", "outputIndexes": +[ 2876 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2855, 2876 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/self_attn/Reshape_output_0", "outputIndexes": +[ 2877 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2877 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 421102368, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.25/self_attn/q_norm/Mul_1_output_0", "outputIndexes": +[ 2879 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2879, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_output_0", "outputIndexes": +[ 2880 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2879 ] +, "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_2_output_0", "outputIndexes": +[ 2881 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2881 ] +, "main_type": "NONE", "name": "Shape10981", "outputIndexes": +[ 2882 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2881 ] +, "main_type": "NONE", "name": "Rank10983", "outputIndexes": +[ 2883 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2883, 2883 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10985", "outputIndexes": +[ 2884 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2884 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10986", "outputIndexes": +[ 2885 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2884, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10988", "outputIndexes": +[ 2886 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2886 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10989", "outputIndexes": +[ 2887 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2882, 2885, 2887, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10992", "outputIndexes": +[ 2888 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2888 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10993", "outputIndexes": +[ 2889 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2889 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10994", "outputIndexes": +[ 2890 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2890, 2889 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10995", "outputIndexes": +[ 2891 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2881, 2891, 2884 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_2_output_0", "outputIndexes": +[ 2892 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2892, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Div_output_0", "outputIndexes": +[ 2893 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2893, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_7_output_0", "outputIndexes": +[ 2894 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2879, 2894, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_1_output_0", "outputIndexes": +[ 2895 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2895 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.25/self_attn/Neg_output_0", "outputIndexes": +[ 2896 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2893, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_6_output_0", "outputIndexes": +[ 2897 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2879, 24, 2897, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_output_0", "outputIndexes": +[ 2898 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2896, 2898 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.25/self_attn/Concat_3_output_0", "outputIndexes": +[ 2899 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2899, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_1_output_0", "outputIndexes": +[ 2900 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2880, 2900 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Add_output_0", "outputIndexes": +[ 2901 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3669 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 421104416, 147478, 36864, 0, 0 ] + } +, "name": "/layers.25/self_attn/k_proj/Linear", "outputIndexes": +[ 3674 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3674 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "outputIndexes": +[ 3675 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3675 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "outputIndexes": +[ 2902 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2866, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_2_output_0", "outputIndexes": +[ 2903 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2874, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_3_output_0", "outputIndexes": +[ 2904 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2903, 2904, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.25/self_attn/Concat_1_output_0", "outputIndexes": +[ 2905 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2902, 2905 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/self_attn/Reshape_1_output_0", "outputIndexes": +[ 2906 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2906 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 421288758, 1024, 1024 ] +, "useRMSNorm": true } +, "name": "/blocks.25/self_attn/k_norm/Mul_1_output_0", "outputIndexes": +[ 2908 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2908, 63 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_2_output_0", "outputIndexes": +[ 2909 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2908 ] +, "main_type": "NONE", "name": "/blocks.25/self_attn/Shape_3_output_0", "outputIndexes": +[ 2910 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2910 ] +, "main_type": "NONE", "name": "Shape10910", "outputIndexes": +[ 2911 ] +, "type": "Shape", "defaultDimentionFormat": "NCHW" } +, +{ "inputIndexes": +[ 2910 ] +, "main_type": "NONE", "name": "Rank10912", "outputIndexes": +[ 2912 ] +, "type": "Rank", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2912, 2912 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10914", "outputIndexes": +[ 2913 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2913 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10915", "outputIndexes": +[ 2914 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2913, 16 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10917", "outputIndexes": +[ 2915 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2915 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze10918", "outputIndexes": +[ 2916 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2911, 2914, 2916, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice10921", "outputIndexes": +[ 2917 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2917 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze10922", "outputIndexes": +[ 2918 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 66, 2918 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10923", "outputIndexes": +[ 2919 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2919, 2918 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp10924", "outputIndexes": +[ 2920 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2910, 2920, 2913 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/blocks.25/self_attn/Gather_3_output_0", "outputIndexes": +[ 2921 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2921, 78 ] +, "main_type": "BinaryOp", "main": +{ "opType": "REALDIV", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Div_1_output_0", "outputIndexes": +[ 2922 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2922, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_9_output_0", "outputIndexes": +[ 2923 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2908, 2923, 81, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_3_output_0", "outputIndexes": +[ 2924 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2924 ] +, "main_type": "UnaryOp", "main": +{ "opType": "NEG", "T": "DT_FLOAT" } +, "name": "/blocks.25/self_attn/Neg_1_output_0", "outputIndexes": +[ 2925 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2922, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_8_output_0", "outputIndexes": +[ 2926 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2908, 24, 2926, 82, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/blocks.25/self_attn/Slice_2_output_0", "outputIndexes": +[ 2927 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2925, 2927 ] +, "main_type": "Axis", "main": +{ "axis": -1 } +, "name": "/blocks.25/self_attn/Concat_4_output_0", "outputIndexes": +[ 2928 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2928, 94 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Mul_3_output_0", "outputIndexes": +[ 2929 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2909, 2929 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/self_attn/Add_1_output_0", "outputIndexes": +[ 2930 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3669 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 256, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4608, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 421290806, 147478, 36864, 0, 0 ] + } +, "name": "/layers.25/self_attn/v_proj/Linear", "outputIndexes": +[ 3678 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3678 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "outputIndexes": +[ 3679 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3679 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 256 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "outputIndexes": +[ 2931 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2866, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_4_output_0", "outputIndexes": +[ 2932 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2874, 24 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "/blocks.25/self_attn/Unsqueeze_5_output_0", "outputIndexes": +[ 2933 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2932, 2933, 19, 35 ] +, "main_type": "Axis", "main": +{ "axis": 0 } +, "name": "/blocks.25/self_attn/Concat_2_output_0", "outputIndexes": +[ 2934 ] +, "type": "Concat", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2931, 2934 ] +, "main_type": "Reshape", "main": +{ "dimType": "NCHW" } +, "name": "/blocks.25/self_attn/Reshape_2_output_0", "outputIndexes": +[ 2935 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 134 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze11102", "outputIndexes": +[ 2936 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 136 ] +, "main_type": "SqueezeParam", "main": +{ "squeezeDims": +[ 0 ] + } +, "name": "Unsqueeze11105", "outputIndexes": +[ 2937 ] +, "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 132, 2936, 2937, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } +, "name": "StridedSlice11108", "outputIndexes": +[ 2938 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2938 ] +, "main_type": "SqueezeParam", "main": +{ } +, "name": "Squeeze11109", "outputIndexes": +[ 2939 ] +, "type": "Squeeze", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 16, 2939 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp11110", "outputIndexes": +[ 2940 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2940, 2939 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MOD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "BinaryOp11111", "outputIndexes": +[ 2941 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 131, 2941, 134 ] +, "main_type": "GatherV2", "main": +{ "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } +, "name": "/Gather_51_output_0", "outputIndexes": +[ 2942 ] +, "type": "GatherV2", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2901, 2930, 2935, 2942 ] +, "main_type": "AttentionParam", "main": +{ "kv_cache": true } +, "name": "Attention/blocks.25/self_attn/Reshape_7_output_0", "outputIndexes": +[ 2943 ] +, "type": "Attention", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2943 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1024, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": +[ 3680 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3680 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "outputIndexes": +[ 3681 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3681 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 1024, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 18432, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 421475148, 589846, 147456, 0, 0 ] + } +, "name": "/layers.25/self_attn/o_proj/Linear", "outputIndexes": +[ 3682 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3682 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "outputIndexes": +[ 3683 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3683 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "outputIndexes": +[ 2944 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2944 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 422212450, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.25/post_attention_layernorm/Mul_1_output_0", "outputIndexes": +[ 2946 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2853, 2946 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/Add_output_0", "outputIndexes": +[ 2947 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2947 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 422221666, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.25/pre_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2948 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2948 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": +[ 3684 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3684 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "outputIndexes": +[ 3685 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3685 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 422230882, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.25/mlp/gate_proj/Linear", "outputIndexes": +[ 3686 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3686 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "outputIndexes": +[ 3687 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3687 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "outputIndexes": +[ 2949 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2949 ] +, "main_type": "UnaryOp", "main": +{ "opType": "SQUARE", "T": "DT_INVALID" } +, "name": "/blocks.25/mlp/act_fn/Mul_output_0", "outputIndexes": +[ 2950 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2949, 2950 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Mul_1_output_0", "outputIndexes": +[ 2951 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 153, 2951 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Mul_2_output_0", "outputIndexes": +[ 2952 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2949, 2952 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Add_output_0", "outputIndexes": +[ 2953 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 152, 2953 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Mul_3_output_0", "outputIndexes": +[ 2954 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2954 ] +, "main_type": "UnaryOp", "main": +{ "opType": "TANH", "T": "DT_INVALID" } +, "name": "/blocks.25/mlp/act_fn/Tanh_output_0", "outputIndexes": +[ 2955 ] +, "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 151, 2955 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Add_1_output_0", "outputIndexes": +[ 2956 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2949, 2956 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Mul_4_output_0", "outputIndexes": +[ 2957 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 148, 2957 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/act_fn/Mul_5_output_0", "outputIndexes": +[ 2958 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3685 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 6912, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 427207544, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.25/mlp/up_proj/Linear", "outputIndexes": +[ 3690 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3690 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/mlp/up_proj/Linear/post_convert", "outputIndexes": +[ 3691 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3691 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 6912 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "outputIndexes": +[ 2959 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2958, 2959 ] +, "main_type": "BinaryOp", "main": +{ "opType": "MUL", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/mlp/Mul_output_0", "outputIndexes": +[ 2960 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2960 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 6912, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "outputIndexes": +[ 3692 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3692 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "outputIndexes": +[ 3693 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3693 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 1152, "inputCount": 6912, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 124416, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } +, "external": +[ 432184206, 3981334, 995328, 0, 0 ] + } +, "name": "/layers.25/mlp/down_proj/Linear", "outputIndexes": +[ 3694 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3694 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/layers.25/mlp/down_proj/Linear/post_convert", "outputIndexes": +[ 3695 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3695 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 1152 ] +, "dimType": "NCHW" } +, "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "outputIndexes": +[ 2961 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2961 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 437160868, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "/blocks.25/post_feedforward_layernorm/Mul_1_output_0", "outputIndexes": +[ 2963 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2947, 2963 ] +, "main_type": "BinaryOp", "main": +{ "opType": "ADD", "T": "DT_FLOAT", "activationType": 0 } +, "name": "/blocks.25/Add_1_output_0", "outputIndexes": +[ 2964 ] +, "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2964, 3, 81, 19, 19 ] +, "main_type": "StridedSliceParam", "main": +{ "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } +, "name": "/Slice_output_0", "outputIndexes": +[ 2965 ] +, "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2965 ] +, "main_type": "LayerNorm", "main": +{ "axis": +[ -1 ] +, "epsilon": 0.000001, "group": 1, "external": +[ 437170084, 4608, 4608 ] +, "useRMSNorm": true } +, "name": "hidden_states", "outputIndexes": +[ 2966 ] +, "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 2966 ] +, "main_type": "Reshape", "main": +{ "dims": +[ -1, 1152, 1, 1 ] +, "dimType": "NCHW" } +, "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": +[ 3696 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3696 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NCHW", "dest": "NC4HW4" } +, "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": +[ 3697 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3697 ] +, "main_type": "Convolution2D", "main": +{ "common": +{ "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 262144, "inputCount": 1152, "relu": false, "relu6": false, "hasOutputShape": false } +, "quanParameter": +{ "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 4718592, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } +, "external": +[ 437179300, 150994970, 37748736, 0, 0 ] + } +, "name": "/lm/lm_head/Linear", "outputIndexes": +[ 3698 ] +, "type": "Convolution", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3698 ] +, "main_type": "TensorConvertInfo", "main": +{ "source": "NC4HW4", "dest": "NCHW" } +, "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": +[ 3699 ] +, "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } +, +{ "inputIndexes": +[ 3699 ] +, "main_type": "Reshape", "main": +{ "dims": +[ 1, -1, 262144 ] +, "dimType": "NCHW" } +, "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": +[ 2967 ] +, "type": "Reshape", "defaultDimentionFormat": "NHWC" } + ] +, "outputName": +[ "logits", "hidden_states", "presents" ] +, "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": +[ "past_key_values", "presents", "position_ids", "logits_index", "input_ids", "/Constant_output_0", "/Mul_output_0", "/blocks.0/Constant_output_0", "/blocks.0/Reshape_output_0", "/blocks.0/input_layernorm/Mul_1_output_0", "/blocks.0/self_attn/q_proj/FakeLinear_output_0", "/blocks.0/self_attn/Shape_output_0", "Shape53", "Rank55", "BinaryOp57", "Unsqueeze58", "Const9", "BinaryOp60", "Unsqueeze61", "Unsqueeze63", "StridedSlice64", "Squeeze65", "BinaryOp67", "/blocks.0/self_attn/Gather_output_0", "/rotary/Constant_4_output_0", "/blocks.0/self_attn/Unsqueeze_output_0", "Unsqueeze77", "Unsqueeze80", "StridedSlice83", "Squeeze84", "BinaryOp85", "BinaryOp86", "/blocks.0/self_attn/Gather_1_output_0", "/blocks.0/self_attn/Unsqueeze_1_output_0", "/blocks.0/self_attn/Constant_3_output_0", "/blocks.0/self_attn/Constant_4_output_0", "/blocks.0/self_attn/Concat_output_0", "/blocks.0/self_attn/Reshape_output_0", "/blocks.0/self_attn/q_norm/Cast_output_0", "/blocks.0/self_attn/q_norm/Mul_1_output_0", "/rotary/Cast_output_0", "/rotary/Constant_1_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_2_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_7_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape117", "Rank119", "BinaryOp121", "Unsqueeze122", "BinaryOp124", "Unsqueeze125", "StridedSlice128", "Squeeze129", "BinaryOp131", "/blocks.0/self_attn/Gather_2_output_0", "/blocks.0/self_attn/Mul_output_0", "/blocks.0/self_attn/Shape_2_output_0", "/blocks.0/self_attn/Constant_9_output_0", "Shape257", "Rank259", "BinaryOp261", "Unsqueeze262", "BinaryOp264", "Unsqueeze265", "StridedSlice268", "Squeeze269", "BinaryOp270", "BinaryOp271", "/blocks.0/self_attn/Gather_4_output_0", "/rotary/Constant_6_output_0", "/blocks.0/self_attn/Div_output_0", "/blocks.0/self_attn/Unsqueeze_7_output_0", "/blocks.0/self_attn/Constant_18_output_0", "/blocks.0/self_attn/Constant_12_output_0", "/blocks.0/self_attn/Slice_1_output_0", "/blocks.0/self_attn/Neg_output_0", "/blocks.0/self_attn/Unsqueeze_6_output_0", "/blocks.0/self_attn/Slice_output_0", "/blocks.0/self_attn/Concat_3_output_0", "Unsqueeze168", "Unsqueeze171", "StridedSlice174", "Squeeze175", "BinaryOp176", "BinaryOp177", "/blocks.0/self_attn/Gather_3_output_0", "/blocks.0/self_attn/Mul_1_output_0", "/blocks.0/self_attn/Add_output_0", "/blocks.0/self_attn/k_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_2_output_0", "/blocks.0/self_attn/Unsqueeze_3_output_0", "/blocks.0/self_attn/Concat_1_output_0", "/blocks.0/self_attn/Reshape_1_output_0", "/blocks.0/self_attn/k_norm/Cast_output_0", "/blocks.0/self_attn/k_norm/Mul_1_output_0", "/blocks.0/self_attn/Mul_2_output_0", "/blocks.0/self_attn/Shape_3_output_0", "Shape136", "Rank138", "BinaryOp140", "Unsqueeze141", "BinaryOp143", "Unsqueeze144", "StridedSlice147", "Squeeze148", "BinaryOp149", "BinaryOp150", "/blocks.0/self_attn/Gather_5_output_0", "/blocks.0/self_attn/Div_1_output_0", "/blocks.0/self_attn/Unsqueeze_9_output_0", "/blocks.0/self_attn/Slice_3_output_0", "/blocks.0/self_attn/Neg_1_output_0", "/blocks.0/self_attn/Unsqueeze_8_output_0", "/blocks.0/self_attn/Slice_2_output_0", "/blocks.0/self_attn/Concat_4_output_0", "/blocks.0/self_attn/Mul_3_output_0", "/blocks.0/self_attn/Add_1_output_0", "/blocks.0/self_attn/v_proj/FakeLinear_output_0", "/blocks.0/self_attn/Unsqueeze_4_output_0", "/blocks.0/self_attn/Unsqueeze_5_output_0", "/blocks.0/self_attn/Concat_2_output_0", "/blocks.0/self_attn/Reshape_2_output_0", "attention_mask", "Shape378", "Rank380", "BinaryOp382", "Unsqueeze383", "BinaryOp385", "Unsqueeze386", "StridedSlice389", "Squeeze390", "BinaryOp391", "BinaryOp392", "/Gather_1_output_0", "/blocks.0/self_attn/Reshape_7_output_0", "/blocks.0/self_attn/o_proj/FakeLinear_output_0", "/blocks.0/post_attention_layernorm/Cast_output_0", "/blocks.0/post_attention_layernorm/Mul_1_output_0", "/blocks.0/Add_output_0", "/blocks.0/mlp/act_fn/Constant_3_output_0", "/blocks.0/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.0/mlp/gate_proj/FakeLinear_output_0", "/blocks.0/input_layernorm/Constant_2_output_0", "/blocks.0/mlp/act_fn/Constant_1_output_0", "/blocks.0/mlp/act_fn/Constant_output_0", "/blocks.0/mlp/act_fn/Mul_output_0", "/blocks.0/mlp/act_fn/Mul_1_output_0", "/blocks.0/mlp/act_fn/Mul_2_output_0", "/blocks.0/mlp/act_fn/Add_output_0", "/blocks.0/mlp/act_fn/Mul_3_output_0", "/blocks.0/mlp/act_fn/Tanh_output_0", "/blocks.0/mlp/act_fn/Add_1_output_0", "/blocks.0/mlp/act_fn/Mul_4_output_0", "/blocks.0/mlp/act_fn/Mul_5_output_0", "/blocks.0/mlp/up_proj/FakeLinear_output_0", "/blocks.0/mlp/Mul_output_0", "/blocks.0/mlp/down_proj/FakeLinear_output_0", "/blocks.0/post_feedforward_layernorm/Cast_output_0", "/blocks.0/post_feedforward_layernorm/Mul_1_output_0", "/blocks.0/Add_1_output_0", "/blocks.1/Reshape_output_0", "/blocks.1/input_layernorm/Mul_1_output_0", "/blocks.1/self_attn/q_proj/FakeLinear_output_0", "/blocks.1/self_attn/Shape_output_0", "Shape546", "Rank548", "BinaryOp550", "Unsqueeze551", "BinaryOp553", "Unsqueeze554", "StridedSlice557", "Squeeze558", "BinaryOp560", "/blocks.1/self_attn/Gather_output_0", "/blocks.1/self_attn/Unsqueeze_output_0", "Unsqueeze568", "Unsqueeze571", "StridedSlice574", "Squeeze575", "BinaryOp576", "BinaryOp577", "/blocks.1/self_attn/Gather_1_output_0", "/blocks.1/self_attn/Unsqueeze_1_output_0", "/blocks.1/self_attn/Concat_output_0", "/blocks.1/self_attn/Reshape_output_0", "/blocks.1/self_attn/q_norm/Cast_output_0", "/blocks.1/self_attn/q_norm/Mul_1_output_0", "/blocks.1/self_attn/Mul_output_0", "/blocks.1/self_attn/Shape_2_output_0", "Shape694", "Rank696", "BinaryOp698", "Unsqueeze699", "BinaryOp701", "Unsqueeze702", "StridedSlice705", "Squeeze706", "BinaryOp707", "BinaryOp708", "/blocks.1/self_attn/Gather_2_output_0", "/blocks.1/self_attn/Div_output_0", "/blocks.1/self_attn/Unsqueeze_7_output_0", "/blocks.1/self_attn/Slice_1_output_0", "/blocks.1/self_attn/Neg_output_0", "/blocks.1/self_attn/Unsqueeze_6_output_0", "/blocks.1/self_attn/Slice_output_0", "/blocks.1/self_attn/Concat_3_output_0", "/blocks.1/self_attn/Mul_1_output_0", "/blocks.1/self_attn/Add_output_0", "/blocks.1/self_attn/k_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_2_output_0", "/blocks.1/self_attn/Unsqueeze_3_output_0", "/blocks.1/self_attn/Concat_1_output_0", "/blocks.1/self_attn/Reshape_1_output_0", "/blocks.1/self_attn/k_norm/Cast_output_0", "/blocks.1/self_attn/k_norm/Mul_1_output_0", "/blocks.1/self_attn/Mul_2_output_0", "/blocks.1/self_attn/Shape_3_output_0", "Shape593", "Rank595", "BinaryOp597", "Unsqueeze598", "BinaryOp600", "Unsqueeze601", "StridedSlice604", "Squeeze605", "BinaryOp606", "BinaryOp607", "/blocks.1/self_attn/Gather_3_output_0", "/blocks.1/self_attn/Div_1_output_0", "/blocks.1/self_attn/Unsqueeze_9_output_0", "/blocks.1/self_attn/Slice_3_output_0", "/blocks.1/self_attn/Neg_1_output_0", "/blocks.1/self_attn/Unsqueeze_8_output_0", "/blocks.1/self_attn/Slice_2_output_0", "/blocks.1/self_attn/Concat_4_output_0", "/blocks.1/self_attn/Mul_3_output_0", "/blocks.1/self_attn/Add_1_output_0", "/blocks.1/self_attn/v_proj/FakeLinear_output_0", "/blocks.1/self_attn/Unsqueeze_4_output_0", "/blocks.1/self_attn/Unsqueeze_5_output_0", "/blocks.1/self_attn/Concat_2_output_0", "/blocks.1/self_attn/Reshape_2_output_0", "Unsqueeze815", "Unsqueeze818", "StridedSlice821", "Squeeze822", "BinaryOp823", "BinaryOp824", "/Gather_3_output_0", "/blocks.1/self_attn/Reshape_7_output_0", "/blocks.1/self_attn/o_proj/FakeLinear_output_0", "/blocks.1/post_attention_layernorm/Cast_output_0", "/blocks.1/post_attention_layernorm/Mul_1_output_0", "/blocks.1/Add_output_0", "/blocks.1/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.1/mlp/gate_proj/FakeLinear_output_0", "/blocks.1/mlp/act_fn/Mul_output_0", "/blocks.1/mlp/act_fn/Mul_1_output_0", "/blocks.1/mlp/act_fn/Mul_2_output_0", "/blocks.1/mlp/act_fn/Add_output_0", "/blocks.1/mlp/act_fn/Mul_3_output_0", "/blocks.1/mlp/act_fn/Tanh_output_0", "/blocks.1/mlp/act_fn/Add_1_output_0", "/blocks.1/mlp/act_fn/Mul_4_output_0", "/blocks.1/mlp/act_fn/Mul_5_output_0", "/blocks.1/mlp/up_proj/FakeLinear_output_0", "/blocks.1/mlp/Mul_output_0", "/blocks.1/mlp/down_proj/FakeLinear_output_0", "/blocks.1/post_feedforward_layernorm/Cast_output_0", "/blocks.1/post_feedforward_layernorm/Mul_1_output_0", "/blocks.1/Add_1_output_0", "/blocks.2/Reshape_output_0", "/blocks.2/input_layernorm/Mul_1_output_0", "/blocks.2/self_attn/q_proj/FakeLinear_output_0", "/blocks.2/self_attn/Shape_output_0", "Shape975", "Rank977", "BinaryOp979", "Unsqueeze980", "BinaryOp982", "Unsqueeze983", "StridedSlice986", "Squeeze987", "BinaryOp989", "/blocks.2/self_attn/Gather_output_0", "/blocks.2/self_attn/Unsqueeze_output_0", "Unsqueeze997", "Unsqueeze1000", "StridedSlice1003", "Squeeze1004", "BinaryOp1005", "BinaryOp1006", "/blocks.2/self_attn/Gather_1_output_0", "/blocks.2/self_attn/Unsqueeze_1_output_0", "/blocks.2/self_attn/Concat_output_0", "/blocks.2/self_attn/Reshape_output_0", "/blocks.2/self_attn/q_norm/Cast_output_0", "/blocks.2/self_attn/q_norm/Mul_1_output_0", "/blocks.2/self_attn/Mul_output_0", "/blocks.2/self_attn/Shape_2_output_0", "Shape1123", "Rank1125", "BinaryOp1127", "Unsqueeze1128", "BinaryOp1130", "Unsqueeze1131", "StridedSlice1134", "Squeeze1135", "BinaryOp1136", "BinaryOp1137", "/blocks.2/self_attn/Gather_2_output_0", "/blocks.2/self_attn/Div_output_0", "/blocks.2/self_attn/Unsqueeze_7_output_0", "/blocks.2/self_attn/Slice_1_output_0", "/blocks.2/self_attn/Neg_output_0", "/blocks.2/self_attn/Unsqueeze_6_output_0", "/blocks.2/self_attn/Slice_output_0", "/blocks.2/self_attn/Concat_3_output_0", "/blocks.2/self_attn/Mul_1_output_0", "/blocks.2/self_attn/Add_output_0", "/blocks.2/self_attn/k_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_2_output_0", "/blocks.2/self_attn/Unsqueeze_3_output_0", "/blocks.2/self_attn/Concat_1_output_0", "/blocks.2/self_attn/Reshape_1_output_0", "/blocks.2/self_attn/k_norm/Cast_output_0", "/blocks.2/self_attn/k_norm/Mul_1_output_0", "/blocks.2/self_attn/Mul_2_output_0", "/blocks.2/self_attn/Shape_3_output_0", "Shape1022", "Rank1024", "BinaryOp1026", "Unsqueeze1027", "BinaryOp1029", "Unsqueeze1030", "StridedSlice1033", "Squeeze1034", "BinaryOp1035", "BinaryOp1036", "/blocks.2/self_attn/Gather_3_output_0", "/blocks.2/self_attn/Div_1_output_0", "/blocks.2/self_attn/Unsqueeze_9_output_0", "/blocks.2/self_attn/Slice_3_output_0", "/blocks.2/self_attn/Neg_1_output_0", "/blocks.2/self_attn/Unsqueeze_8_output_0", "/blocks.2/self_attn/Slice_2_output_0", "/blocks.2/self_attn/Concat_4_output_0", "/blocks.2/self_attn/Mul_3_output_0", "/blocks.2/self_attn/Add_1_output_0", "/blocks.2/self_attn/v_proj/FakeLinear_output_0", "/blocks.2/self_attn/Unsqueeze_4_output_0", "/blocks.2/self_attn/Unsqueeze_5_output_0", "/blocks.2/self_attn/Concat_2_output_0", "/blocks.2/self_attn/Reshape_2_output_0", "Unsqueeze1244", "Unsqueeze1247", "StridedSlice1250", "Squeeze1251", "BinaryOp1252", "BinaryOp1253", "/Gather_5_output_0", "/blocks.2/self_attn/Reshape_7_output_0", "/blocks.2/self_attn/o_proj/FakeLinear_output_0", "/blocks.2/post_attention_layernorm/Cast_output_0", "/blocks.2/post_attention_layernorm/Mul_1_output_0", "/blocks.2/Add_output_0", "/blocks.2/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.2/mlp/gate_proj/FakeLinear_output_0", "/blocks.2/mlp/act_fn/Mul_output_0", "/blocks.2/mlp/act_fn/Mul_1_output_0", "/blocks.2/mlp/act_fn/Mul_2_output_0", "/blocks.2/mlp/act_fn/Add_output_0", "/blocks.2/mlp/act_fn/Mul_3_output_0", "/blocks.2/mlp/act_fn/Tanh_output_0", "/blocks.2/mlp/act_fn/Add_1_output_0", "/blocks.2/mlp/act_fn/Mul_4_output_0", "/blocks.2/mlp/act_fn/Mul_5_output_0", "/blocks.2/mlp/up_proj/FakeLinear_output_0", "/blocks.2/mlp/Mul_output_0", "/blocks.2/mlp/down_proj/FakeLinear_output_0", "/blocks.2/post_feedforward_layernorm/Cast_output_0", "/blocks.2/post_feedforward_layernorm/Mul_1_output_0", "/blocks.2/Add_1_output_0", "/blocks.3/Reshape_output_0", "/blocks.3/input_layernorm/Mul_1_output_0", "/blocks.3/self_attn/q_proj/FakeLinear_output_0", "/blocks.3/self_attn/Shape_output_0", "Shape1404", "Rank1406", "BinaryOp1408", "Unsqueeze1409", "BinaryOp1411", "Unsqueeze1412", "StridedSlice1415", "Squeeze1416", "BinaryOp1418", "/blocks.3/self_attn/Gather_output_0", "/blocks.3/self_attn/Unsqueeze_output_0", "Unsqueeze1426", "Unsqueeze1429", "StridedSlice1432", "Squeeze1433", "BinaryOp1434", "BinaryOp1435", "/blocks.3/self_attn/Gather_1_output_0", "/blocks.3/self_attn/Unsqueeze_1_output_0", "/blocks.3/self_attn/Concat_output_0", "/blocks.3/self_attn/Reshape_output_0", "/blocks.3/self_attn/q_norm/Cast_output_0", "/blocks.3/self_attn/q_norm/Mul_1_output_0", "/blocks.3/self_attn/Mul_output_0", "/blocks.3/self_attn/Shape_2_output_0", "Shape1552", "Rank1554", "BinaryOp1556", "Unsqueeze1557", "BinaryOp1559", "Unsqueeze1560", "StridedSlice1563", "Squeeze1564", "BinaryOp1565", "BinaryOp1566", "/blocks.3/self_attn/Gather_2_output_0", "/blocks.3/self_attn/Div_output_0", "/blocks.3/self_attn/Unsqueeze_7_output_0", "/blocks.3/self_attn/Slice_1_output_0", "/blocks.3/self_attn/Neg_output_0", "/blocks.3/self_attn/Unsqueeze_6_output_0", "/blocks.3/self_attn/Slice_output_0", "/blocks.3/self_attn/Concat_3_output_0", "/blocks.3/self_attn/Mul_1_output_0", "/blocks.3/self_attn/Add_output_0", "/blocks.3/self_attn/k_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_2_output_0", "/blocks.3/self_attn/Unsqueeze_3_output_0", "/blocks.3/self_attn/Concat_1_output_0", "/blocks.3/self_attn/Reshape_1_output_0", "/blocks.3/self_attn/k_norm/Cast_output_0", "/blocks.3/self_attn/k_norm/Mul_1_output_0", "/blocks.3/self_attn/Mul_2_output_0", "/blocks.3/self_attn/Shape_3_output_0", "Shape1451", "Rank1453", "BinaryOp1455", "Unsqueeze1456", "BinaryOp1458", "Unsqueeze1459", "StridedSlice1462", "Squeeze1463", "BinaryOp1464", "BinaryOp1465", "/blocks.3/self_attn/Gather_3_output_0", "/blocks.3/self_attn/Div_1_output_0", "/blocks.3/self_attn/Unsqueeze_9_output_0", "/blocks.3/self_attn/Slice_3_output_0", "/blocks.3/self_attn/Neg_1_output_0", "/blocks.3/self_attn/Unsqueeze_8_output_0", "/blocks.3/self_attn/Slice_2_output_0", "/blocks.3/self_attn/Concat_4_output_0", "/blocks.3/self_attn/Mul_3_output_0", "/blocks.3/self_attn/Add_1_output_0", "/blocks.3/self_attn/v_proj/FakeLinear_output_0", "/blocks.3/self_attn/Unsqueeze_4_output_0", "/blocks.3/self_attn/Unsqueeze_5_output_0", "/blocks.3/self_attn/Concat_2_output_0", "/blocks.3/self_attn/Reshape_2_output_0", "Unsqueeze1673", "Unsqueeze1676", "StridedSlice1679", "Squeeze1680", "BinaryOp1681", "BinaryOp1682", "/Gather_7_output_0", "/blocks.3/self_attn/Reshape_7_output_0", "/blocks.3/self_attn/o_proj/FakeLinear_output_0", "/blocks.3/post_attention_layernorm/Cast_output_0", "/blocks.3/post_attention_layernorm/Mul_1_output_0", "/blocks.3/Add_output_0", "/blocks.3/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.3/mlp/gate_proj/FakeLinear_output_0", "/blocks.3/mlp/act_fn/Mul_output_0", "/blocks.3/mlp/act_fn/Mul_1_output_0", "/blocks.3/mlp/act_fn/Mul_2_output_0", "/blocks.3/mlp/act_fn/Add_output_0", "/blocks.3/mlp/act_fn/Mul_3_output_0", "/blocks.3/mlp/act_fn/Tanh_output_0", "/blocks.3/mlp/act_fn/Add_1_output_0", "/blocks.3/mlp/act_fn/Mul_4_output_0", "/blocks.3/mlp/act_fn/Mul_5_output_0", "/blocks.3/mlp/up_proj/FakeLinear_output_0", "/blocks.3/mlp/Mul_output_0", "/blocks.3/mlp/down_proj/FakeLinear_output_0", "/blocks.3/post_feedforward_layernorm/Cast_output_0", "/blocks.3/post_feedforward_layernorm/Mul_1_output_0", "/blocks.3/Add_1_output_0", "/blocks.4/Reshape_output_0", "/blocks.4/input_layernorm/Mul_1_output_0", "/blocks.4/self_attn/q_proj/FakeLinear_output_0", "/blocks.4/self_attn/Shape_output_0", "Shape1833", "Rank1835", "BinaryOp1837", "Unsqueeze1838", "BinaryOp1840", "Unsqueeze1841", "StridedSlice1844", "Squeeze1845", "BinaryOp1847", "/blocks.4/self_attn/Gather_output_0", "/blocks.4/self_attn/Unsqueeze_output_0", "Unsqueeze1855", "Unsqueeze1858", "StridedSlice1861", "Squeeze1862", "BinaryOp1863", "BinaryOp1864", "/blocks.4/self_attn/Gather_1_output_0", "/blocks.4/self_attn/Unsqueeze_1_output_0", "/blocks.4/self_attn/Concat_output_0", "/blocks.4/self_attn/Reshape_output_0", "/blocks.4/self_attn/q_norm/Cast_output_0", "/blocks.4/self_attn/q_norm/Mul_1_output_0", "/blocks.4/self_attn/Mul_output_0", "/blocks.4/self_attn/Shape_2_output_0", "Shape1982", "Rank1984", "BinaryOp1986", "Unsqueeze1987", "BinaryOp1989", "Unsqueeze1990", "StridedSlice1993", "Squeeze1994", "BinaryOp1995", "BinaryOp1996", "/blocks.4/self_attn/Gather_2_output_0", "/blocks.4/self_attn/Div_output_0", "/blocks.4/self_attn/Unsqueeze_7_output_0", "/blocks.4/self_attn/Slice_1_output_0", "/blocks.4/self_attn/Neg_output_0", "/blocks.4/self_attn/Unsqueeze_6_output_0", "/blocks.4/self_attn/Slice_output_0", "/blocks.4/self_attn/Concat_3_output_0", "/blocks.4/self_attn/Mul_1_output_0", "/blocks.4/self_attn/Add_output_0", "/blocks.4/self_attn/k_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_2_output_0", "/blocks.4/self_attn/Unsqueeze_3_output_0", "/blocks.4/self_attn/Concat_1_output_0", "/blocks.4/self_attn/Reshape_1_output_0", "/blocks.4/self_attn/k_norm/Cast_output_0", "/blocks.4/self_attn/k_norm/Mul_1_output_0", "/blocks.4/self_attn/Mul_2_output_0", "/blocks.4/self_attn/Shape_3_output_0", "Shape1880", "Rank1882", "BinaryOp1884", "Unsqueeze1885", "BinaryOp1887", "Unsqueeze1888", "StridedSlice1891", "Squeeze1892", "BinaryOp1893", "BinaryOp1894", "/blocks.4/self_attn/Gather_3_output_0", "/blocks.4/self_attn/Div_1_output_0", "/blocks.4/self_attn/Unsqueeze_9_output_0", "/blocks.4/self_attn/Slice_3_output_0", "/blocks.4/self_attn/Neg_1_output_0", "/blocks.4/self_attn/Unsqueeze_8_output_0", "/blocks.4/self_attn/Slice_2_output_0", "/blocks.4/self_attn/Concat_4_output_0", "/blocks.4/self_attn/Mul_3_output_0", "/blocks.4/self_attn/Add_1_output_0", "/blocks.4/self_attn/v_proj/FakeLinear_output_0", "/blocks.4/self_attn/Unsqueeze_4_output_0", "/blocks.4/self_attn/Unsqueeze_5_output_0", "/blocks.4/self_attn/Concat_2_output_0", "/blocks.4/self_attn/Reshape_2_output_0", "Unsqueeze2103", "Unsqueeze2106", "StridedSlice2109", "Squeeze2110", "BinaryOp2111", "BinaryOp2112", "/Gather_9_output_0", "/blocks.4/self_attn/Reshape_7_output_0", "/blocks.4/self_attn/o_proj/FakeLinear_output_0", "/blocks.4/post_attention_layernorm/Cast_output_0", "/blocks.4/post_attention_layernorm/Mul_1_output_0", "/blocks.4/Add_output_0", "/blocks.4/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.4/mlp/gate_proj/FakeLinear_output_0", "/blocks.4/mlp/act_fn/Mul_output_0", "/blocks.4/mlp/act_fn/Mul_1_output_0", "/blocks.4/mlp/act_fn/Mul_2_output_0", "/blocks.4/mlp/act_fn/Add_output_0", "/blocks.4/mlp/act_fn/Mul_3_output_0", "/blocks.4/mlp/act_fn/Tanh_output_0", "/blocks.4/mlp/act_fn/Add_1_output_0", "/blocks.4/mlp/act_fn/Mul_4_output_0", "/blocks.4/mlp/act_fn/Mul_5_output_0", "/blocks.4/mlp/up_proj/FakeLinear_output_0", "/blocks.4/mlp/Mul_output_0", "/blocks.4/mlp/down_proj/FakeLinear_output_0", "/blocks.4/post_feedforward_layernorm/Cast_output_0", "/blocks.4/post_feedforward_layernorm/Mul_1_output_0", "/blocks.4/Add_1_output_0", "/blocks.5/Reshape_output_0", "/blocks.5/input_layernorm/Mul_1_output_0", "/blocks.5/self_attn/q_proj/FakeLinear_output_0", "/blocks.5/self_attn/Shape_output_0", "Shape2263", "Rank2265", "BinaryOp2267", "Unsqueeze2268", "BinaryOp2270", "Unsqueeze2271", "StridedSlice2274", "Squeeze2275", "BinaryOp2277", "/blocks.5/self_attn/Gather_output_0", "/blocks.5/self_attn/Unsqueeze_output_0", "Unsqueeze2285", "Unsqueeze2288", "StridedSlice2291", "Squeeze2292", "BinaryOp2293", "BinaryOp2294", "/blocks.5/self_attn/Gather_1_output_0", "/blocks.5/self_attn/Unsqueeze_1_output_0", "/blocks.5/self_attn/Concat_output_0", "/blocks.5/self_attn/Reshape_output_0", "/blocks.5/self_attn/q_norm/Cast_output_0", "/blocks.5/self_attn/q_norm/Mul_1_output_0", "/blocks.5/self_attn/Mul_output_0", "/blocks.5/self_attn/Shape_2_output_0", "Shape2412", "Rank2414", "BinaryOp2416", "Unsqueeze2417", "BinaryOp2419", "Unsqueeze2420", "StridedSlice2423", "Squeeze2424", "BinaryOp2425", "BinaryOp2426", "/blocks.5/self_attn/Gather_2_output_0", "/blocks.5/self_attn/Div_output_0", "/blocks.5/self_attn/Unsqueeze_7_output_0", "/blocks.5/self_attn/Slice_1_output_0", "/blocks.5/self_attn/Neg_output_0", "/blocks.5/self_attn/Unsqueeze_6_output_0", "/blocks.5/self_attn/Slice_output_0", "/blocks.5/self_attn/Concat_3_output_0", "/blocks.5/self_attn/Mul_1_output_0", "/blocks.5/self_attn/Add_output_0", "/blocks.5/self_attn/k_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_2_output_0", "/blocks.5/self_attn/Unsqueeze_3_output_0", "/blocks.5/self_attn/Concat_1_output_0", "/blocks.5/self_attn/Reshape_1_output_0", "/blocks.5/self_attn/k_norm/Cast_output_0", "/blocks.5/self_attn/k_norm/Mul_1_output_0", "/blocks.5/self_attn/Mul_2_output_0", "/blocks.5/self_attn/Shape_3_output_0", "Shape2310", "Rank2312", "BinaryOp2314", "Unsqueeze2315", "BinaryOp2317", "Unsqueeze2318", "StridedSlice2321", "Squeeze2322", "BinaryOp2323", "BinaryOp2324", "/blocks.5/self_attn/Gather_3_output_0", "/blocks.5/self_attn/Div_1_output_0", "/blocks.5/self_attn/Unsqueeze_9_output_0", "/blocks.5/self_attn/Slice_3_output_0", "/blocks.5/self_attn/Neg_1_output_0", "/blocks.5/self_attn/Unsqueeze_8_output_0", "/blocks.5/self_attn/Slice_2_output_0", "/blocks.5/self_attn/Concat_4_output_0", "/blocks.5/self_attn/Mul_3_output_0", "/blocks.5/self_attn/Add_1_output_0", "/blocks.5/self_attn/v_proj/FakeLinear_output_0", "/blocks.5/self_attn/Unsqueeze_4_output_0", "/blocks.5/self_attn/Unsqueeze_5_output_0", "/blocks.5/self_attn/Concat_2_output_0", "/blocks.5/self_attn/Reshape_2_output_0", "Unsqueeze2533", "Unsqueeze2536", "StridedSlice2539", "Squeeze2540", "BinaryOp2542", "/Gather_11_output_0", "/blocks.5/self_attn/Reshape_7_output_0", "/blocks.5/self_attn/o_proj/FakeLinear_output_0", "/blocks.5/post_attention_layernorm/Cast_output_0", "/blocks.5/post_attention_layernorm/Mul_1_output_0", "/blocks.5/Add_output_0", "/blocks.5/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.5/mlp/gate_proj/FakeLinear_output_0", "/blocks.5/mlp/act_fn/Mul_output_0", "/blocks.5/mlp/act_fn/Mul_1_output_0", "/blocks.5/mlp/act_fn/Mul_2_output_0", "/blocks.5/mlp/act_fn/Add_output_0", "/blocks.5/mlp/act_fn/Mul_3_output_0", "/blocks.5/mlp/act_fn/Tanh_output_0", "/blocks.5/mlp/act_fn/Add_1_output_0", "/blocks.5/mlp/act_fn/Mul_4_output_0", "/blocks.5/mlp/act_fn/Mul_5_output_0", "/blocks.5/mlp/up_proj/FakeLinear_output_0", "/blocks.5/mlp/Mul_output_0", "/blocks.5/mlp/down_proj/FakeLinear_output_0", "/blocks.5/post_feedforward_layernorm/Cast_output_0", "/blocks.5/post_feedforward_layernorm/Mul_1_output_0", "/blocks.5/Add_1_output_0", "/blocks.6/Reshape_output_0", "/blocks.6/input_layernorm/Mul_1_output_0", "/blocks.6/self_attn/q_proj/FakeLinear_output_0", "/blocks.6/self_attn/Shape_output_0", "Shape2693", "Rank2695", "BinaryOp2697", "Unsqueeze2698", "BinaryOp2700", "Unsqueeze2701", "StridedSlice2704", "Squeeze2705", "BinaryOp2707", "/blocks.6/self_attn/Gather_output_0", "/blocks.6/self_attn/Unsqueeze_output_0", "Unsqueeze2715", "Unsqueeze2718", "StridedSlice2721", "Squeeze2722", "BinaryOp2723", "BinaryOp2724", "/blocks.6/self_attn/Gather_1_output_0", "/blocks.6/self_attn/Unsqueeze_1_output_0", "/blocks.6/self_attn/Concat_output_0", "/blocks.6/self_attn/Reshape_output_0", "/blocks.6/self_attn/q_norm/Cast_output_0", "/blocks.6/self_attn/q_norm/Mul_1_output_0", "/blocks.6/self_attn/Mul_output_0", "/blocks.6/self_attn/Shape_2_output_0", "Shape2842", "Rank2844", "BinaryOp2846", "Unsqueeze2847", "BinaryOp2849", "Unsqueeze2850", "StridedSlice2853", "Squeeze2854", "BinaryOp2855", "BinaryOp2856", "/blocks.6/self_attn/Gather_2_output_0", "/blocks.6/self_attn/Div_output_0", "/blocks.6/self_attn/Unsqueeze_7_output_0", "/blocks.6/self_attn/Slice_1_output_0", "/blocks.6/self_attn/Neg_output_0", "/blocks.6/self_attn/Unsqueeze_6_output_0", "/blocks.6/self_attn/Slice_output_0", "/blocks.6/self_attn/Concat_3_output_0", "/blocks.6/self_attn/Mul_1_output_0", "/blocks.6/self_attn/Add_output_0", "/blocks.6/self_attn/k_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_2_output_0", "/blocks.6/self_attn/Unsqueeze_3_output_0", "/blocks.6/self_attn/Concat_1_output_0", "/blocks.6/self_attn/Reshape_1_output_0", "/blocks.6/self_attn/k_norm/Cast_output_0", "/blocks.6/self_attn/k_norm/Mul_1_output_0", "/blocks.6/self_attn/Mul_2_output_0", "/blocks.6/self_attn/Shape_3_output_0", "Shape2740", "Rank2742", "BinaryOp2744", "Unsqueeze2745", "BinaryOp2747", "Unsqueeze2748", "StridedSlice2751", "Squeeze2752", "BinaryOp2753", "BinaryOp2754", "/blocks.6/self_attn/Gather_3_output_0", "/blocks.6/self_attn/Div_1_output_0", "/blocks.6/self_attn/Unsqueeze_9_output_0", "/blocks.6/self_attn/Slice_3_output_0", "/blocks.6/self_attn/Neg_1_output_0", "/blocks.6/self_attn/Unsqueeze_8_output_0", "/blocks.6/self_attn/Slice_2_output_0", "/blocks.6/self_attn/Concat_4_output_0", "/blocks.6/self_attn/Mul_3_output_0", "/blocks.6/self_attn/Add_1_output_0", "/blocks.6/self_attn/v_proj/FakeLinear_output_0", "/blocks.6/self_attn/Unsqueeze_4_output_0", "/blocks.6/self_attn/Unsqueeze_5_output_0", "/blocks.6/self_attn/Concat_2_output_0", "/blocks.6/self_attn/Reshape_2_output_0", "Unsqueeze2963", "Unsqueeze2966", "StridedSlice2969", "Squeeze2970", "BinaryOp2971", "BinaryOp2972", "/Gather_13_output_0", "/blocks.6/self_attn/Reshape_7_output_0", "/blocks.6/self_attn/o_proj/FakeLinear_output_0", "/blocks.6/post_attention_layernorm/Cast_output_0", "/blocks.6/post_attention_layernorm/Mul_1_output_0", "/blocks.6/Add_output_0", "/blocks.6/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.6/mlp/gate_proj/FakeLinear_output_0", "/blocks.6/mlp/act_fn/Mul_output_0", "/blocks.6/mlp/act_fn/Mul_1_output_0", "/blocks.6/mlp/act_fn/Mul_2_output_0", "/blocks.6/mlp/act_fn/Add_output_0", "/blocks.6/mlp/act_fn/Mul_3_output_0", "/blocks.6/mlp/act_fn/Tanh_output_0", "/blocks.6/mlp/act_fn/Add_1_output_0", "/blocks.6/mlp/act_fn/Mul_4_output_0", "/blocks.6/mlp/act_fn/Mul_5_output_0", "/blocks.6/mlp/up_proj/FakeLinear_output_0", "/blocks.6/mlp/Mul_output_0", "/blocks.6/mlp/down_proj/FakeLinear_output_0", "/blocks.6/post_feedforward_layernorm/Cast_output_0", "/blocks.6/post_feedforward_layernorm/Mul_1_output_0", "/blocks.6/Add_1_output_0", "/blocks.7/Reshape_output_0", "/blocks.7/input_layernorm/Mul_1_output_0", "/blocks.7/self_attn/q_proj/FakeLinear_output_0", "/blocks.7/self_attn/Shape_output_0", "Shape3123", "Rank3125", "BinaryOp3127", "Unsqueeze3128", "BinaryOp3130", "Unsqueeze3131", "StridedSlice3134", "Squeeze3135", "BinaryOp3137", "/blocks.7/self_attn/Gather_output_0", "/blocks.7/self_attn/Unsqueeze_output_0", "Unsqueeze3145", "Unsqueeze3148", "StridedSlice3151", "Squeeze3152", "BinaryOp3153", "BinaryOp3154", "/blocks.7/self_attn/Gather_1_output_0", "/blocks.7/self_attn/Unsqueeze_1_output_0", "/blocks.7/self_attn/Concat_output_0", "/blocks.7/self_attn/Reshape_output_0", "/blocks.7/self_attn/q_norm/Cast_output_0", "/blocks.7/self_attn/q_norm/Mul_1_output_0", "/blocks.7/self_attn/Mul_output_0", "/blocks.7/self_attn/Shape_2_output_0", "Shape3272", "Rank3274", "BinaryOp3276", "Unsqueeze3277", "BinaryOp3279", "Unsqueeze3280", "StridedSlice3283", "Squeeze3284", "BinaryOp3285", "BinaryOp3286", "/blocks.7/self_attn/Gather_2_output_0", "/blocks.7/self_attn/Div_output_0", "/blocks.7/self_attn/Unsqueeze_7_output_0", "/blocks.7/self_attn/Slice_1_output_0", "/blocks.7/self_attn/Neg_output_0", "/blocks.7/self_attn/Unsqueeze_6_output_0", "/blocks.7/self_attn/Slice_output_0", "/blocks.7/self_attn/Concat_3_output_0", "/blocks.7/self_attn/Mul_1_output_0", "/blocks.7/self_attn/Add_output_0", "/blocks.7/self_attn/k_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_2_output_0", "/blocks.7/self_attn/Unsqueeze_3_output_0", "/blocks.7/self_attn/Concat_1_output_0", "/blocks.7/self_attn/Reshape_1_output_0", "/blocks.7/self_attn/k_norm/Cast_output_0", "/blocks.7/self_attn/k_norm/Mul_1_output_0", "/blocks.7/self_attn/Mul_2_output_0", "/blocks.7/self_attn/Shape_3_output_0", "Shape3170", "Rank3172", "BinaryOp3174", "Unsqueeze3175", "BinaryOp3177", "Unsqueeze3178", "StridedSlice3181", "Squeeze3182", "BinaryOp3183", "BinaryOp3184", "/blocks.7/self_attn/Gather_3_output_0", "/blocks.7/self_attn/Div_1_output_0", "/blocks.7/self_attn/Unsqueeze_9_output_0", "/blocks.7/self_attn/Slice_3_output_0", "/blocks.7/self_attn/Neg_1_output_0", "/blocks.7/self_attn/Unsqueeze_8_output_0", "/blocks.7/self_attn/Slice_2_output_0", "/blocks.7/self_attn/Concat_4_output_0", "/blocks.7/self_attn/Mul_3_output_0", "/blocks.7/self_attn/Add_1_output_0", "/blocks.7/self_attn/v_proj/FakeLinear_output_0", "/blocks.7/self_attn/Unsqueeze_4_output_0", "/blocks.7/self_attn/Unsqueeze_5_output_0", "/blocks.7/self_attn/Concat_2_output_0", "/blocks.7/self_attn/Reshape_2_output_0", "Unsqueeze3393", "Unsqueeze3396", "StridedSlice3399", "Squeeze3400", "BinaryOp3401", "BinaryOp3402", "/Gather_15_output_0", "/blocks.7/self_attn/Reshape_7_output_0", "/blocks.7/self_attn/o_proj/FakeLinear_output_0", "/blocks.7/post_attention_layernorm/Cast_output_0", "/blocks.7/post_attention_layernorm/Mul_1_output_0", "/blocks.7/Add_output_0", "/blocks.7/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.7/mlp/gate_proj/FakeLinear_output_0", "/blocks.7/mlp/act_fn/Mul_output_0", "/blocks.7/mlp/act_fn/Mul_1_output_0", "/blocks.7/mlp/act_fn/Mul_2_output_0", "/blocks.7/mlp/act_fn/Add_output_0", "/blocks.7/mlp/act_fn/Mul_3_output_0", "/blocks.7/mlp/act_fn/Tanh_output_0", "/blocks.7/mlp/act_fn/Add_1_output_0", "/blocks.7/mlp/act_fn/Mul_4_output_0", "/blocks.7/mlp/act_fn/Mul_5_output_0", "/blocks.7/mlp/up_proj/FakeLinear_output_0", "/blocks.7/mlp/Mul_output_0", "/blocks.7/mlp/down_proj/FakeLinear_output_0", "/blocks.7/post_feedforward_layernorm/Cast_output_0", "/blocks.7/post_feedforward_layernorm/Mul_1_output_0", "/blocks.7/Add_1_output_0", "/blocks.8/Reshape_output_0", "/blocks.8/input_layernorm/Mul_1_output_0", "/blocks.8/self_attn/q_proj/FakeLinear_output_0", "/blocks.8/self_attn/Shape_output_0", "Shape3553", "Rank3555", "BinaryOp3557", "Unsqueeze3558", "BinaryOp3560", "Unsqueeze3561", "StridedSlice3564", "Squeeze3565", "BinaryOp3567", "/blocks.8/self_attn/Gather_output_0", "/blocks.8/self_attn/Unsqueeze_output_0", "Unsqueeze3575", "Unsqueeze3578", "StridedSlice3581", "Squeeze3582", "BinaryOp3583", "BinaryOp3584", "/blocks.8/self_attn/Gather_1_output_0", "/blocks.8/self_attn/Unsqueeze_1_output_0", "/blocks.8/self_attn/Concat_output_0", "/blocks.8/self_attn/Reshape_output_0", "/blocks.8/self_attn/q_norm/Cast_output_0", "/blocks.8/self_attn/q_norm/Mul_1_output_0", "/blocks.8/self_attn/Mul_output_0", "/blocks.8/self_attn/Shape_2_output_0", "Shape3702", "Rank3704", "BinaryOp3706", "Unsqueeze3707", "BinaryOp3709", "Unsqueeze3710", "StridedSlice3713", "Squeeze3714", "BinaryOp3715", "BinaryOp3716", "/blocks.8/self_attn/Gather_2_output_0", "/blocks.8/self_attn/Div_output_0", "/blocks.8/self_attn/Unsqueeze_7_output_0", "/blocks.8/self_attn/Slice_1_output_0", "/blocks.8/self_attn/Neg_output_0", "/blocks.8/self_attn/Unsqueeze_6_output_0", "/blocks.8/self_attn/Slice_output_0", "/blocks.8/self_attn/Concat_3_output_0", "/blocks.8/self_attn/Mul_1_output_0", "/blocks.8/self_attn/Add_output_0", "/blocks.8/self_attn/k_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_2_output_0", "/blocks.8/self_attn/Unsqueeze_3_output_0", "/blocks.8/self_attn/Concat_1_output_0", "/blocks.8/self_attn/Reshape_1_output_0", "/blocks.8/self_attn/k_norm/Cast_output_0", "/blocks.8/self_attn/k_norm/Mul_1_output_0", "/blocks.8/self_attn/Mul_2_output_0", "/blocks.8/self_attn/Shape_3_output_0", "Shape3600", "Rank3602", "BinaryOp3604", "Unsqueeze3605", "BinaryOp3607", "Unsqueeze3608", "StridedSlice3611", "Squeeze3612", "BinaryOp3613", "BinaryOp3614", "/blocks.8/self_attn/Gather_3_output_0", "/blocks.8/self_attn/Div_1_output_0", "/blocks.8/self_attn/Unsqueeze_9_output_0", "/blocks.8/self_attn/Slice_3_output_0", "/blocks.8/self_attn/Neg_1_output_0", "/blocks.8/self_attn/Unsqueeze_8_output_0", "/blocks.8/self_attn/Slice_2_output_0", "/blocks.8/self_attn/Concat_4_output_0", "/blocks.8/self_attn/Mul_3_output_0", "/blocks.8/self_attn/Add_1_output_0", "/blocks.8/self_attn/v_proj/FakeLinear_output_0", "/blocks.8/self_attn/Unsqueeze_4_output_0", "/blocks.8/self_attn/Unsqueeze_5_output_0", "/blocks.8/self_attn/Concat_2_output_0", "/blocks.8/self_attn/Reshape_2_output_0", "Unsqueeze3823", "Unsqueeze3826", "StridedSlice3829", "Squeeze3830", "BinaryOp3831", "BinaryOp3832", "/Gather_17_output_0", "/blocks.8/self_attn/Reshape_7_output_0", "/blocks.8/self_attn/o_proj/FakeLinear_output_0", "/blocks.8/post_attention_layernorm/Cast_output_0", "/blocks.8/post_attention_layernorm/Mul_1_output_0", "/blocks.8/Add_output_0", "/blocks.8/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.8/mlp/gate_proj/FakeLinear_output_0", "/blocks.8/mlp/act_fn/Mul_output_0", "/blocks.8/mlp/act_fn/Mul_1_output_0", "/blocks.8/mlp/act_fn/Mul_2_output_0", "/blocks.8/mlp/act_fn/Add_output_0", "/blocks.8/mlp/act_fn/Mul_3_output_0", "/blocks.8/mlp/act_fn/Tanh_output_0", "/blocks.8/mlp/act_fn/Add_1_output_0", "/blocks.8/mlp/act_fn/Mul_4_output_0", "/blocks.8/mlp/act_fn/Mul_5_output_0", "/blocks.8/mlp/up_proj/FakeLinear_output_0", "/blocks.8/mlp/Mul_output_0", "/blocks.8/mlp/down_proj/FakeLinear_output_0", "/blocks.8/post_feedforward_layernorm/Cast_output_0", "/blocks.8/post_feedforward_layernorm/Mul_1_output_0", "/blocks.8/Add_1_output_0", "/blocks.9/Reshape_output_0", "/blocks.9/input_layernorm/Mul_1_output_0", "/blocks.9/self_attn/q_proj/FakeLinear_output_0", "/blocks.9/self_attn/Shape_output_0", "Shape3983", "Rank3985", "BinaryOp3987", "Unsqueeze3988", "BinaryOp3990", "Unsqueeze3991", "StridedSlice3994", "Squeeze3995", "BinaryOp3997", "/blocks.9/self_attn/Gather_output_0", "/blocks.9/self_attn/Unsqueeze_output_0", "Unsqueeze4005", "Unsqueeze4008", "StridedSlice4011", "Squeeze4012", "BinaryOp4013", "BinaryOp4014", "/blocks.9/self_attn/Gather_1_output_0", "/blocks.9/self_attn/Unsqueeze_1_output_0", "/blocks.9/self_attn/Concat_output_0", "/blocks.9/self_attn/Reshape_output_0", "/blocks.9/self_attn/q_norm/Cast_output_0", "/blocks.9/self_attn/q_norm/Mul_1_output_0", "/blocks.9/self_attn/Mul_output_0", "/blocks.9/self_attn/Shape_2_output_0", "Shape4132", "Rank4134", "BinaryOp4136", "Unsqueeze4137", "BinaryOp4139", "Unsqueeze4140", "StridedSlice4143", "Squeeze4144", "BinaryOp4145", "BinaryOp4146", "/blocks.9/self_attn/Gather_2_output_0", "/blocks.9/self_attn/Div_output_0", "/blocks.9/self_attn/Unsqueeze_7_output_0", "/blocks.9/self_attn/Slice_1_output_0", "/blocks.9/self_attn/Neg_output_0", "/blocks.9/self_attn/Unsqueeze_6_output_0", "/blocks.9/self_attn/Slice_output_0", "/blocks.9/self_attn/Concat_3_output_0", "/blocks.9/self_attn/Mul_1_output_0", "/blocks.9/self_attn/Add_output_0", "/blocks.9/self_attn/k_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_2_output_0", "/blocks.9/self_attn/Unsqueeze_3_output_0", "/blocks.9/self_attn/Concat_1_output_0", "/blocks.9/self_attn/Reshape_1_output_0", "/blocks.9/self_attn/k_norm/Cast_output_0", "/blocks.9/self_attn/k_norm/Mul_1_output_0", "/blocks.9/self_attn/Mul_2_output_0", "/blocks.9/self_attn/Shape_3_output_0", "Shape4030", "Rank4032", "BinaryOp4034", "Unsqueeze4035", "BinaryOp4037", "Unsqueeze4038", "StridedSlice4041", "Squeeze4042", "BinaryOp4043", "BinaryOp4044", "/blocks.9/self_attn/Gather_3_output_0", "/blocks.9/self_attn/Div_1_output_0", "/blocks.9/self_attn/Unsqueeze_9_output_0", "/blocks.9/self_attn/Slice_3_output_0", "/blocks.9/self_attn/Neg_1_output_0", "/blocks.9/self_attn/Unsqueeze_8_output_0", "/blocks.9/self_attn/Slice_2_output_0", "/blocks.9/self_attn/Concat_4_output_0", "/blocks.9/self_attn/Mul_3_output_0", "/blocks.9/self_attn/Add_1_output_0", "/blocks.9/self_attn/v_proj/FakeLinear_output_0", "/blocks.9/self_attn/Unsqueeze_4_output_0", "/blocks.9/self_attn/Unsqueeze_5_output_0", "/blocks.9/self_attn/Concat_2_output_0", "/blocks.9/self_attn/Reshape_2_output_0", "Unsqueeze4253", "Unsqueeze4256", "StridedSlice4259", "Squeeze4260", "BinaryOp4261", "BinaryOp4262", "/Gather_19_output_0", "/blocks.9/self_attn/Reshape_7_output_0", "/blocks.9/self_attn/o_proj/FakeLinear_output_0", "/blocks.9/post_attention_layernorm/Cast_output_0", "/blocks.9/post_attention_layernorm/Mul_1_output_0", "/blocks.9/Add_output_0", "/blocks.9/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.9/mlp/gate_proj/FakeLinear_output_0", "/blocks.9/mlp/act_fn/Mul_output_0", "/blocks.9/mlp/act_fn/Mul_1_output_0", "/blocks.9/mlp/act_fn/Mul_2_output_0", "/blocks.9/mlp/act_fn/Add_output_0", "/blocks.9/mlp/act_fn/Mul_3_output_0", "/blocks.9/mlp/act_fn/Tanh_output_0", "/blocks.9/mlp/act_fn/Add_1_output_0", "/blocks.9/mlp/act_fn/Mul_4_output_0", "/blocks.9/mlp/act_fn/Mul_5_output_0", "/blocks.9/mlp/up_proj/FakeLinear_output_0", "/blocks.9/mlp/Mul_output_0", "/blocks.9/mlp/down_proj/FakeLinear_output_0", "/blocks.9/post_feedforward_layernorm/Cast_output_0", "/blocks.9/post_feedforward_layernorm/Mul_1_output_0", "/blocks.9/Add_1_output_0", "/blocks.10/Reshape_output_0", "/blocks.10/input_layernorm/Mul_1_output_0", "/blocks.10/self_attn/q_proj/FakeLinear_output_0", "/blocks.10/self_attn/Shape_output_0", "Shape4413", "Rank4415", "BinaryOp4417", "Unsqueeze4418", "BinaryOp4420", "Unsqueeze4421", "StridedSlice4424", "Squeeze4425", "BinaryOp4427", "/blocks.10/self_attn/Gather_output_0", "/blocks.10/self_attn/Unsqueeze_output_0", "Unsqueeze4435", "Unsqueeze4438", "StridedSlice4441", "Squeeze4442", "BinaryOp4443", "BinaryOp4444", "/blocks.10/self_attn/Gather_1_output_0", "/blocks.10/self_attn/Unsqueeze_1_output_0", "/blocks.10/self_attn/Concat_output_0", "/blocks.10/self_attn/Reshape_output_0", "/blocks.10/self_attn/q_norm/Cast_output_0", "/blocks.10/self_attn/q_norm/Mul_1_output_0", "/blocks.10/self_attn/Mul_output_0", "/blocks.10/self_attn/Shape_2_output_0", "Shape4562", "Rank4564", "BinaryOp4566", "Unsqueeze4567", "BinaryOp4569", "Unsqueeze4570", "StridedSlice4573", "Squeeze4574", "BinaryOp4575", "BinaryOp4576", "/blocks.10/self_attn/Gather_2_output_0", "/blocks.10/self_attn/Div_output_0", "/blocks.10/self_attn/Unsqueeze_7_output_0", "/blocks.10/self_attn/Slice_1_output_0", "/blocks.10/self_attn/Neg_output_0", "/blocks.10/self_attn/Unsqueeze_6_output_0", "/blocks.10/self_attn/Slice_output_0", "/blocks.10/self_attn/Concat_3_output_0", "/blocks.10/self_attn/Mul_1_output_0", "/blocks.10/self_attn/Add_output_0", "/blocks.10/self_attn/k_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_2_output_0", "/blocks.10/self_attn/Unsqueeze_3_output_0", "/blocks.10/self_attn/Concat_1_output_0", "/blocks.10/self_attn/Reshape_1_output_0", "/blocks.10/self_attn/k_norm/Cast_output_0", "/blocks.10/self_attn/k_norm/Mul_1_output_0", "/blocks.10/self_attn/Mul_2_output_0", "/blocks.10/self_attn/Shape_3_output_0", "Shape4460", "Rank4462", "BinaryOp4464", "Unsqueeze4465", "BinaryOp4467", "Unsqueeze4468", "StridedSlice4471", "Squeeze4472", "BinaryOp4473", "BinaryOp4474", "/blocks.10/self_attn/Gather_3_output_0", "/blocks.10/self_attn/Div_1_output_0", "/blocks.10/self_attn/Unsqueeze_9_output_0", "/blocks.10/self_attn/Slice_3_output_0", "/blocks.10/self_attn/Neg_1_output_0", "/blocks.10/self_attn/Unsqueeze_8_output_0", "/blocks.10/self_attn/Slice_2_output_0", "/blocks.10/self_attn/Concat_4_output_0", "/blocks.10/self_attn/Mul_3_output_0", "/blocks.10/self_attn/Add_1_output_0", "/blocks.10/self_attn/v_proj/FakeLinear_output_0", "/blocks.10/self_attn/Unsqueeze_4_output_0", "/blocks.10/self_attn/Unsqueeze_5_output_0", "/blocks.10/self_attn/Concat_2_output_0", "/blocks.10/self_attn/Reshape_2_output_0", "Unsqueeze4683", "Unsqueeze4686", "StridedSlice4689", "Squeeze4690", "BinaryOp4691", "BinaryOp4692", "/Gather_21_output_0", "/blocks.10/self_attn/Reshape_7_output_0", "/blocks.10/self_attn/o_proj/FakeLinear_output_0", "/blocks.10/post_attention_layernorm/Cast_output_0", "/blocks.10/post_attention_layernorm/Mul_1_output_0", "/blocks.10/Add_output_0", "/blocks.10/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.10/mlp/gate_proj/FakeLinear_output_0", "/blocks.10/mlp/act_fn/Mul_output_0", "/blocks.10/mlp/act_fn/Mul_1_output_0", "/blocks.10/mlp/act_fn/Mul_2_output_0", "/blocks.10/mlp/act_fn/Add_output_0", "/blocks.10/mlp/act_fn/Mul_3_output_0", "/blocks.10/mlp/act_fn/Tanh_output_0", "/blocks.10/mlp/act_fn/Add_1_output_0", "/blocks.10/mlp/act_fn/Mul_4_output_0", "/blocks.10/mlp/act_fn/Mul_5_output_0", "/blocks.10/mlp/up_proj/FakeLinear_output_0", "/blocks.10/mlp/Mul_output_0", "/blocks.10/mlp/down_proj/FakeLinear_output_0", "/blocks.10/post_feedforward_layernorm/Cast_output_0", "/blocks.10/post_feedforward_layernorm/Mul_1_output_0", "/blocks.10/Add_1_output_0", "/blocks.11/Reshape_output_0", "/blocks.11/input_layernorm/Mul_1_output_0", "/blocks.11/self_attn/q_proj/FakeLinear_output_0", "/blocks.11/self_attn/Shape_output_0", "Shape4843", "Rank4845", "BinaryOp4847", "Unsqueeze4848", "BinaryOp4850", "Unsqueeze4851", "StridedSlice4854", "Squeeze4855", "BinaryOp4857", "/blocks.11/self_attn/Gather_output_0", "/blocks.11/self_attn/Unsqueeze_output_0", "Unsqueeze4865", "Unsqueeze4868", "StridedSlice4871", "Squeeze4872", "BinaryOp4873", "BinaryOp4874", "/blocks.11/self_attn/Gather_1_output_0", "/blocks.11/self_attn/Unsqueeze_1_output_0", "/blocks.11/self_attn/Concat_output_0", "/blocks.11/self_attn/Reshape_output_0", "/blocks.11/self_attn/q_norm/Cast_output_0", "/blocks.11/self_attn/q_norm/Mul_1_output_0", "/blocks.11/self_attn/Mul_output_0", "/blocks.11/self_attn/Shape_2_output_0", "Shape4992", "Rank4994", "BinaryOp4996", "Unsqueeze4997", "BinaryOp4999", "Unsqueeze5000", "StridedSlice5003", "Squeeze5004", "BinaryOp5005", "BinaryOp5006", "/blocks.11/self_attn/Gather_2_output_0", "/blocks.11/self_attn/Div_output_0", "/blocks.11/self_attn/Unsqueeze_7_output_0", "/blocks.11/self_attn/Slice_1_output_0", "/blocks.11/self_attn/Neg_output_0", "/blocks.11/self_attn/Unsqueeze_6_output_0", "/blocks.11/self_attn/Slice_output_0", "/blocks.11/self_attn/Concat_3_output_0", "/blocks.11/self_attn/Mul_1_output_0", "/blocks.11/self_attn/Add_output_0", "/blocks.11/self_attn/k_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_2_output_0", "/blocks.11/self_attn/Unsqueeze_3_output_0", "/blocks.11/self_attn/Concat_1_output_0", "/blocks.11/self_attn/Reshape_1_output_0", "/blocks.11/self_attn/k_norm/Cast_output_0", "/blocks.11/self_attn/k_norm/Mul_1_output_0", "/blocks.11/self_attn/Mul_2_output_0", "/blocks.11/self_attn/Shape_3_output_0", "Shape4890", "Rank4892", "BinaryOp4894", "Unsqueeze4895", "BinaryOp4897", "Unsqueeze4898", "StridedSlice4901", "Squeeze4902", "BinaryOp4903", "BinaryOp4904", "/blocks.11/self_attn/Gather_3_output_0", "/blocks.11/self_attn/Div_1_output_0", "/blocks.11/self_attn/Unsqueeze_9_output_0", "/blocks.11/self_attn/Slice_3_output_0", "/blocks.11/self_attn/Neg_1_output_0", "/blocks.11/self_attn/Unsqueeze_8_output_0", "/blocks.11/self_attn/Slice_2_output_0", "/blocks.11/self_attn/Concat_4_output_0", "/blocks.11/self_attn/Mul_3_output_0", "/blocks.11/self_attn/Add_1_output_0", "/blocks.11/self_attn/v_proj/FakeLinear_output_0", "/blocks.11/self_attn/Unsqueeze_4_output_0", "/blocks.11/self_attn/Unsqueeze_5_output_0", "/blocks.11/self_attn/Concat_2_output_0", "/blocks.11/self_attn/Reshape_2_output_0", "Unsqueeze5113", "Unsqueeze5116", "StridedSlice5119", "Squeeze5120", "BinaryOp5122", "/Gather_23_output_0", "/blocks.11/self_attn/Reshape_7_output_0", "/blocks.11/self_attn/o_proj/FakeLinear_output_0", "/blocks.11/post_attention_layernorm/Cast_output_0", "/blocks.11/post_attention_layernorm/Mul_1_output_0", "/blocks.11/Add_output_0", "/blocks.11/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.11/mlp/gate_proj/FakeLinear_output_0", "/blocks.11/mlp/act_fn/Mul_output_0", "/blocks.11/mlp/act_fn/Mul_1_output_0", "/blocks.11/mlp/act_fn/Mul_2_output_0", "/blocks.11/mlp/act_fn/Add_output_0", "/blocks.11/mlp/act_fn/Mul_3_output_0", "/blocks.11/mlp/act_fn/Tanh_output_0", "/blocks.11/mlp/act_fn/Add_1_output_0", "/blocks.11/mlp/act_fn/Mul_4_output_0", "/blocks.11/mlp/act_fn/Mul_5_output_0", "/blocks.11/mlp/up_proj/FakeLinear_output_0", "/blocks.11/mlp/Mul_output_0", "/blocks.11/mlp/down_proj/FakeLinear_output_0", "/blocks.11/post_feedforward_layernorm/Cast_output_0", "/blocks.11/post_feedforward_layernorm/Mul_1_output_0", "/blocks.11/Add_1_output_0", "/blocks.12/Reshape_output_0", "/blocks.12/input_layernorm/Mul_1_output_0", "/blocks.12/self_attn/q_proj/FakeLinear_output_0", "/blocks.12/self_attn/Shape_output_0", "Shape5273", "Rank5275", "BinaryOp5277", "Unsqueeze5278", "BinaryOp5280", "Unsqueeze5281", "StridedSlice5284", "Squeeze5285", "BinaryOp5287", "/blocks.12/self_attn/Gather_output_0", "/blocks.12/self_attn/Unsqueeze_output_0", "Unsqueeze5295", "Unsqueeze5298", "StridedSlice5301", "Squeeze5302", "BinaryOp5303", "BinaryOp5304", "/blocks.12/self_attn/Gather_1_output_0", "/blocks.12/self_attn/Unsqueeze_1_output_0", "/blocks.12/self_attn/Concat_output_0", "/blocks.12/self_attn/Reshape_output_0", "/blocks.12/self_attn/q_norm/Cast_output_0", "/blocks.12/self_attn/q_norm/Mul_1_output_0", "/blocks.12/self_attn/Mul_output_0", "/blocks.12/self_attn/Shape_2_output_0", "Shape5422", "Rank5424", "BinaryOp5426", "Unsqueeze5427", "BinaryOp5429", "Unsqueeze5430", "StridedSlice5433", "Squeeze5434", "BinaryOp5435", "BinaryOp5436", "/blocks.12/self_attn/Gather_2_output_0", "/blocks.12/self_attn/Div_output_0", "/blocks.12/self_attn/Unsqueeze_7_output_0", "/blocks.12/self_attn/Slice_1_output_0", "/blocks.12/self_attn/Neg_output_0", "/blocks.12/self_attn/Unsqueeze_6_output_0", "/blocks.12/self_attn/Slice_output_0", "/blocks.12/self_attn/Concat_3_output_0", "/blocks.12/self_attn/Mul_1_output_0", "/blocks.12/self_attn/Add_output_0", "/blocks.12/self_attn/k_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_2_output_0", "/blocks.12/self_attn/Unsqueeze_3_output_0", "/blocks.12/self_attn/Concat_1_output_0", "/blocks.12/self_attn/Reshape_1_output_0", "/blocks.12/self_attn/k_norm/Cast_output_0", "/blocks.12/self_attn/k_norm/Mul_1_output_0", "/blocks.12/self_attn/Mul_2_output_0", "/blocks.12/self_attn/Shape_3_output_0", "Shape5320", "Rank5322", "BinaryOp5324", "Unsqueeze5325", "BinaryOp5327", "Unsqueeze5328", "StridedSlice5331", "Squeeze5332", "BinaryOp5333", "BinaryOp5334", "/blocks.12/self_attn/Gather_3_output_0", "/blocks.12/self_attn/Div_1_output_0", "/blocks.12/self_attn/Unsqueeze_9_output_0", "/blocks.12/self_attn/Slice_3_output_0", "/blocks.12/self_attn/Neg_1_output_0", "/blocks.12/self_attn/Unsqueeze_8_output_0", "/blocks.12/self_attn/Slice_2_output_0", "/blocks.12/self_attn/Concat_4_output_0", "/blocks.12/self_attn/Mul_3_output_0", "/blocks.12/self_attn/Add_1_output_0", "/blocks.12/self_attn/v_proj/FakeLinear_output_0", "/blocks.12/self_attn/Unsqueeze_4_output_0", "/blocks.12/self_attn/Unsqueeze_5_output_0", "/blocks.12/self_attn/Concat_2_output_0", "/blocks.12/self_attn/Reshape_2_output_0", "Unsqueeze5543", "Unsqueeze5546", "StridedSlice5549", "Squeeze5550", "BinaryOp5551", "BinaryOp5552", "/Gather_25_output_0", "/blocks.12/self_attn/Reshape_7_output_0", "/blocks.12/self_attn/o_proj/FakeLinear_output_0", "/blocks.12/post_attention_layernorm/Cast_output_0", "/blocks.12/post_attention_layernorm/Mul_1_output_0", "/blocks.12/Add_output_0", "/blocks.12/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.12/mlp/gate_proj/FakeLinear_output_0", "/blocks.12/mlp/act_fn/Mul_output_0", "/blocks.12/mlp/act_fn/Mul_1_output_0", "/blocks.12/mlp/act_fn/Mul_2_output_0", "/blocks.12/mlp/act_fn/Add_output_0", "/blocks.12/mlp/act_fn/Mul_3_output_0", "/blocks.12/mlp/act_fn/Tanh_output_0", "/blocks.12/mlp/act_fn/Add_1_output_0", "/blocks.12/mlp/act_fn/Mul_4_output_0", "/blocks.12/mlp/act_fn/Mul_5_output_0", "/blocks.12/mlp/up_proj/FakeLinear_output_0", "/blocks.12/mlp/Mul_output_0", "/blocks.12/mlp/down_proj/FakeLinear_output_0", "/blocks.12/post_feedforward_layernorm/Cast_output_0", "/blocks.12/post_feedforward_layernorm/Mul_1_output_0", "/blocks.12/Add_1_output_0", "/blocks.13/Reshape_output_0", "/blocks.13/input_layernorm/Mul_1_output_0", "/blocks.13/self_attn/q_proj/FakeLinear_output_0", "/blocks.13/self_attn/Shape_output_0", "Shape5703", "Rank5705", "BinaryOp5707", "Unsqueeze5708", "BinaryOp5710", "Unsqueeze5711", "StridedSlice5714", "Squeeze5715", "BinaryOp5717", "/blocks.13/self_attn/Gather_output_0", "/blocks.13/self_attn/Unsqueeze_output_0", "Unsqueeze5725", "Unsqueeze5728", "StridedSlice5731", "Squeeze5732", "BinaryOp5733", "BinaryOp5734", "/blocks.13/self_attn/Gather_1_output_0", "/blocks.13/self_attn/Unsqueeze_1_output_0", "/blocks.13/self_attn/Concat_output_0", "/blocks.13/self_attn/Reshape_output_0", "/blocks.13/self_attn/q_norm/Cast_output_0", "/blocks.13/self_attn/q_norm/Mul_1_output_0", "/blocks.13/self_attn/Mul_output_0", "/blocks.13/self_attn/Shape_2_output_0", "Shape5852", "Rank5854", "BinaryOp5856", "Unsqueeze5857", "BinaryOp5859", "Unsqueeze5860", "StridedSlice5863", "Squeeze5864", "BinaryOp5865", "BinaryOp5866", "/blocks.13/self_attn/Gather_2_output_0", "/blocks.13/self_attn/Div_output_0", "/blocks.13/self_attn/Unsqueeze_7_output_0", "/blocks.13/self_attn/Slice_1_output_0", "/blocks.13/self_attn/Neg_output_0", "/blocks.13/self_attn/Unsqueeze_6_output_0", "/blocks.13/self_attn/Slice_output_0", "/blocks.13/self_attn/Concat_3_output_0", "/blocks.13/self_attn/Mul_1_output_0", "/blocks.13/self_attn/Add_output_0", "/blocks.13/self_attn/k_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_2_output_0", "/blocks.13/self_attn/Unsqueeze_3_output_0", "/blocks.13/self_attn/Concat_1_output_0", "/blocks.13/self_attn/Reshape_1_output_0", "/blocks.13/self_attn/k_norm/Cast_output_0", "/blocks.13/self_attn/k_norm/Mul_1_output_0", "/blocks.13/self_attn/Mul_2_output_0", "/blocks.13/self_attn/Shape_3_output_0", "Shape5750", "Rank5752", "BinaryOp5754", "Unsqueeze5755", "BinaryOp5757", "Unsqueeze5758", "StridedSlice5761", "Squeeze5762", "BinaryOp5763", "BinaryOp5764", "/blocks.13/self_attn/Gather_3_output_0", "/blocks.13/self_attn/Div_1_output_0", "/blocks.13/self_attn/Unsqueeze_9_output_0", "/blocks.13/self_attn/Slice_3_output_0", "/blocks.13/self_attn/Neg_1_output_0", "/blocks.13/self_attn/Unsqueeze_8_output_0", "/blocks.13/self_attn/Slice_2_output_0", "/blocks.13/self_attn/Concat_4_output_0", "/blocks.13/self_attn/Mul_3_output_0", "/blocks.13/self_attn/Add_1_output_0", "/blocks.13/self_attn/v_proj/FakeLinear_output_0", "/blocks.13/self_attn/Unsqueeze_4_output_0", "/blocks.13/self_attn/Unsqueeze_5_output_0", "/blocks.13/self_attn/Concat_2_output_0", "/blocks.13/self_attn/Reshape_2_output_0", "Unsqueeze5973", "Unsqueeze5976", "StridedSlice5979", "Squeeze5980", "BinaryOp5981", "BinaryOp5982", "/Gather_27_output_0", "/blocks.13/self_attn/Reshape_7_output_0", "/blocks.13/self_attn/o_proj/FakeLinear_output_0", "/blocks.13/post_attention_layernorm/Cast_output_0", "/blocks.13/post_attention_layernorm/Mul_1_output_0", "/blocks.13/Add_output_0", "/blocks.13/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.13/mlp/gate_proj/FakeLinear_output_0", "/blocks.13/mlp/act_fn/Mul_output_0", "/blocks.13/mlp/act_fn/Mul_1_output_0", "/blocks.13/mlp/act_fn/Mul_2_output_0", "/blocks.13/mlp/act_fn/Add_output_0", "/blocks.13/mlp/act_fn/Mul_3_output_0", "/blocks.13/mlp/act_fn/Tanh_output_0", "/blocks.13/mlp/act_fn/Add_1_output_0", "/blocks.13/mlp/act_fn/Mul_4_output_0", "/blocks.13/mlp/act_fn/Mul_5_output_0", "/blocks.13/mlp/up_proj/FakeLinear_output_0", "/blocks.13/mlp/Mul_output_0", "/blocks.13/mlp/down_proj/FakeLinear_output_0", "/blocks.13/post_feedforward_layernorm/Cast_output_0", "/blocks.13/post_feedforward_layernorm/Mul_1_output_0", "/blocks.13/Add_1_output_0", "/blocks.14/Reshape_output_0", "/blocks.14/input_layernorm/Mul_1_output_0", "/blocks.14/self_attn/q_proj/FakeLinear_output_0", "/blocks.14/self_attn/Shape_output_0", "Shape6133", "Rank6135", "BinaryOp6137", "Unsqueeze6138", "BinaryOp6140", "Unsqueeze6141", "StridedSlice6144", "Squeeze6145", "BinaryOp6147", "/blocks.14/self_attn/Gather_output_0", "/blocks.14/self_attn/Unsqueeze_output_0", "Unsqueeze6155", "Unsqueeze6158", "StridedSlice6161", "Squeeze6162", "BinaryOp6163", "BinaryOp6164", "/blocks.14/self_attn/Gather_1_output_0", "/blocks.14/self_attn/Unsqueeze_1_output_0", "/blocks.14/self_attn/Concat_output_0", "/blocks.14/self_attn/Reshape_output_0", "/blocks.14/self_attn/q_norm/Cast_output_0", "/blocks.14/self_attn/q_norm/Mul_1_output_0", "/blocks.14/self_attn/Mul_output_0", "/blocks.14/self_attn/Shape_2_output_0", "Shape6282", "Rank6284", "BinaryOp6286", "Unsqueeze6287", "BinaryOp6289", "Unsqueeze6290", "StridedSlice6293", "Squeeze6294", "BinaryOp6295", "BinaryOp6296", "/blocks.14/self_attn/Gather_2_output_0", "/blocks.14/self_attn/Div_output_0", "/blocks.14/self_attn/Unsqueeze_7_output_0", "/blocks.14/self_attn/Slice_1_output_0", "/blocks.14/self_attn/Neg_output_0", "/blocks.14/self_attn/Unsqueeze_6_output_0", "/blocks.14/self_attn/Slice_output_0", "/blocks.14/self_attn/Concat_3_output_0", "/blocks.14/self_attn/Mul_1_output_0", "/blocks.14/self_attn/Add_output_0", "/blocks.14/self_attn/k_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_2_output_0", "/blocks.14/self_attn/Unsqueeze_3_output_0", "/blocks.14/self_attn/Concat_1_output_0", "/blocks.14/self_attn/Reshape_1_output_0", "/blocks.14/self_attn/k_norm/Cast_output_0", "/blocks.14/self_attn/k_norm/Mul_1_output_0", "/blocks.14/self_attn/Mul_2_output_0", "/blocks.14/self_attn/Shape_3_output_0", "Shape6180", "Rank6182", "BinaryOp6184", "Unsqueeze6185", "BinaryOp6187", "Unsqueeze6188", "StridedSlice6191", "Squeeze6192", "BinaryOp6193", "BinaryOp6194", "/blocks.14/self_attn/Gather_3_output_0", "/blocks.14/self_attn/Div_1_output_0", "/blocks.14/self_attn/Unsqueeze_9_output_0", "/blocks.14/self_attn/Slice_3_output_0", "/blocks.14/self_attn/Neg_1_output_0", "/blocks.14/self_attn/Unsqueeze_8_output_0", "/blocks.14/self_attn/Slice_2_output_0", "/blocks.14/self_attn/Concat_4_output_0", "/blocks.14/self_attn/Mul_3_output_0", "/blocks.14/self_attn/Add_1_output_0", "/blocks.14/self_attn/v_proj/FakeLinear_output_0", "/blocks.14/self_attn/Unsqueeze_4_output_0", "/blocks.14/self_attn/Unsqueeze_5_output_0", "/blocks.14/self_attn/Concat_2_output_0", "/blocks.14/self_attn/Reshape_2_output_0", "Unsqueeze6403", "Unsqueeze6406", "StridedSlice6409", "Squeeze6410", "BinaryOp6411", "BinaryOp6412", "/Gather_29_output_0", "/blocks.14/self_attn/Reshape_7_output_0", "/blocks.14/self_attn/o_proj/FakeLinear_output_0", "/blocks.14/post_attention_layernorm/Cast_output_0", "/blocks.14/post_attention_layernorm/Mul_1_output_0", "/blocks.14/Add_output_0", "/blocks.14/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.14/mlp/gate_proj/FakeLinear_output_0", "/blocks.14/mlp/act_fn/Mul_output_0", "/blocks.14/mlp/act_fn/Mul_1_output_0", "/blocks.14/mlp/act_fn/Mul_2_output_0", "/blocks.14/mlp/act_fn/Add_output_0", "/blocks.14/mlp/act_fn/Mul_3_output_0", "/blocks.14/mlp/act_fn/Tanh_output_0", "/blocks.14/mlp/act_fn/Add_1_output_0", "/blocks.14/mlp/act_fn/Mul_4_output_0", "/blocks.14/mlp/act_fn/Mul_5_output_0", "/blocks.14/mlp/up_proj/FakeLinear_output_0", "/blocks.14/mlp/Mul_output_0", "/blocks.14/mlp/down_proj/FakeLinear_output_0", "/blocks.14/post_feedforward_layernorm/Cast_output_0", "/blocks.14/post_feedforward_layernorm/Mul_1_output_0", "/blocks.14/Add_1_output_0", "/blocks.15/Reshape_output_0", "/blocks.15/input_layernorm/Mul_1_output_0", "/blocks.15/self_attn/q_proj/FakeLinear_output_0", "/blocks.15/self_attn/Shape_output_0", "Shape6563", "Rank6565", "BinaryOp6567", "Unsqueeze6568", "BinaryOp6570", "Unsqueeze6571", "StridedSlice6574", "Squeeze6575", "BinaryOp6577", "/blocks.15/self_attn/Gather_output_0", "/blocks.15/self_attn/Unsqueeze_output_0", "Unsqueeze6585", "Unsqueeze6588", "StridedSlice6591", "Squeeze6592", "BinaryOp6593", "BinaryOp6594", "/blocks.15/self_attn/Gather_1_output_0", "/blocks.15/self_attn/Unsqueeze_1_output_0", "/blocks.15/self_attn/Concat_output_0", "/blocks.15/self_attn/Reshape_output_0", "/blocks.15/self_attn/q_norm/Cast_output_0", "/blocks.15/self_attn/q_norm/Mul_1_output_0", "/blocks.15/self_attn/Mul_output_0", "/blocks.15/self_attn/Shape_2_output_0", "Shape6712", "Rank6714", "BinaryOp6716", "Unsqueeze6717", "BinaryOp6719", "Unsqueeze6720", "StridedSlice6723", "Squeeze6724", "BinaryOp6725", "BinaryOp6726", "/blocks.15/self_attn/Gather_2_output_0", "/blocks.15/self_attn/Div_output_0", "/blocks.15/self_attn/Unsqueeze_7_output_0", "/blocks.15/self_attn/Slice_1_output_0", "/blocks.15/self_attn/Neg_output_0", "/blocks.15/self_attn/Unsqueeze_6_output_0", "/blocks.15/self_attn/Slice_output_0", "/blocks.15/self_attn/Concat_3_output_0", "/blocks.15/self_attn/Mul_1_output_0", "/blocks.15/self_attn/Add_output_0", "/blocks.15/self_attn/k_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_2_output_0", "/blocks.15/self_attn/Unsqueeze_3_output_0", "/blocks.15/self_attn/Concat_1_output_0", "/blocks.15/self_attn/Reshape_1_output_0", "/blocks.15/self_attn/k_norm/Cast_output_0", "/blocks.15/self_attn/k_norm/Mul_1_output_0", "/blocks.15/self_attn/Mul_2_output_0", "/blocks.15/self_attn/Shape_3_output_0", "Shape6610", "Rank6612", "BinaryOp6614", "Unsqueeze6615", "BinaryOp6617", "Unsqueeze6618", "StridedSlice6621", "Squeeze6622", "BinaryOp6623", "BinaryOp6624", "/blocks.15/self_attn/Gather_3_output_0", "/blocks.15/self_attn/Div_1_output_0", "/blocks.15/self_attn/Unsqueeze_9_output_0", "/blocks.15/self_attn/Slice_3_output_0", "/blocks.15/self_attn/Neg_1_output_0", "/blocks.15/self_attn/Unsqueeze_8_output_0", "/blocks.15/self_attn/Slice_2_output_0", "/blocks.15/self_attn/Concat_4_output_0", "/blocks.15/self_attn/Mul_3_output_0", "/blocks.15/self_attn/Add_1_output_0", "/blocks.15/self_attn/v_proj/FakeLinear_output_0", "/blocks.15/self_attn/Unsqueeze_4_output_0", "/blocks.15/self_attn/Unsqueeze_5_output_0", "/blocks.15/self_attn/Concat_2_output_0", "/blocks.15/self_attn/Reshape_2_output_0", "Unsqueeze6833", "Unsqueeze6836", "StridedSlice6839", "Squeeze6840", "BinaryOp6841", "BinaryOp6842", "/Gather_31_output_0", "/blocks.15/self_attn/Reshape_7_output_0", "/blocks.15/self_attn/o_proj/FakeLinear_output_0", "/blocks.15/post_attention_layernorm/Cast_output_0", "/blocks.15/post_attention_layernorm/Mul_1_output_0", "/blocks.15/Add_output_0", "/blocks.15/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.15/mlp/gate_proj/FakeLinear_output_0", "/blocks.15/mlp/act_fn/Mul_output_0", "/blocks.15/mlp/act_fn/Mul_1_output_0", "/blocks.15/mlp/act_fn/Mul_2_output_0", "/blocks.15/mlp/act_fn/Add_output_0", "/blocks.15/mlp/act_fn/Mul_3_output_0", "/blocks.15/mlp/act_fn/Tanh_output_0", "/blocks.15/mlp/act_fn/Add_1_output_0", "/blocks.15/mlp/act_fn/Mul_4_output_0", "/blocks.15/mlp/act_fn/Mul_5_output_0", "/blocks.15/mlp/up_proj/FakeLinear_output_0", "/blocks.15/mlp/Mul_output_0", "/blocks.15/mlp/down_proj/FakeLinear_output_0", "/blocks.15/post_feedforward_layernorm/Cast_output_0", "/blocks.15/post_feedforward_layernorm/Mul_1_output_0", "/blocks.15/Add_1_output_0", "/blocks.16/Reshape_output_0", "/blocks.16/input_layernorm/Mul_1_output_0", "/blocks.16/self_attn/q_proj/FakeLinear_output_0", "/blocks.16/self_attn/Shape_output_0", "Shape6993", "Rank6995", "BinaryOp6997", "Unsqueeze6998", "BinaryOp7000", "Unsqueeze7001", "StridedSlice7004", "Squeeze7005", "BinaryOp7007", "/blocks.16/self_attn/Gather_output_0", "/blocks.16/self_attn/Unsqueeze_output_0", "Unsqueeze7015", "Unsqueeze7018", "StridedSlice7021", "Squeeze7022", "BinaryOp7023", "BinaryOp7024", "/blocks.16/self_attn/Gather_1_output_0", "/blocks.16/self_attn/Unsqueeze_1_output_0", "/blocks.16/self_attn/Concat_output_0", "/blocks.16/self_attn/Reshape_output_0", "/blocks.16/self_attn/q_norm/Cast_output_0", "/blocks.16/self_attn/q_norm/Mul_1_output_0", "/blocks.16/self_attn/Mul_output_0", "/blocks.16/self_attn/Shape_2_output_0", "Shape7142", "Rank7144", "BinaryOp7146", "Unsqueeze7147", "BinaryOp7149", "Unsqueeze7150", "StridedSlice7153", "Squeeze7154", "BinaryOp7155", "BinaryOp7156", "/blocks.16/self_attn/Gather_2_output_0", "/blocks.16/self_attn/Div_output_0", "/blocks.16/self_attn/Unsqueeze_7_output_0", "/blocks.16/self_attn/Slice_1_output_0", "/blocks.16/self_attn/Neg_output_0", "/blocks.16/self_attn/Unsqueeze_6_output_0", "/blocks.16/self_attn/Slice_output_0", "/blocks.16/self_attn/Concat_3_output_0", "/blocks.16/self_attn/Mul_1_output_0", "/blocks.16/self_attn/Add_output_0", "/blocks.16/self_attn/k_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_2_output_0", "/blocks.16/self_attn/Unsqueeze_3_output_0", "/blocks.16/self_attn/Concat_1_output_0", "/blocks.16/self_attn/Reshape_1_output_0", "/blocks.16/self_attn/k_norm/Cast_output_0", "/blocks.16/self_attn/k_norm/Mul_1_output_0", "/blocks.16/self_attn/Mul_2_output_0", "/blocks.16/self_attn/Shape_3_output_0", "Shape7040", "Rank7042", "BinaryOp7044", "Unsqueeze7045", "BinaryOp7047", "Unsqueeze7048", "StridedSlice7051", "Squeeze7052", "BinaryOp7053", "BinaryOp7054", "/blocks.16/self_attn/Gather_3_output_0", "/blocks.16/self_attn/Div_1_output_0", "/blocks.16/self_attn/Unsqueeze_9_output_0", "/blocks.16/self_attn/Slice_3_output_0", "/blocks.16/self_attn/Neg_1_output_0", "/blocks.16/self_attn/Unsqueeze_8_output_0", "/blocks.16/self_attn/Slice_2_output_0", "/blocks.16/self_attn/Concat_4_output_0", "/blocks.16/self_attn/Mul_3_output_0", "/blocks.16/self_attn/Add_1_output_0", "/blocks.16/self_attn/v_proj/FakeLinear_output_0", "/blocks.16/self_attn/Unsqueeze_4_output_0", "/blocks.16/self_attn/Unsqueeze_5_output_0", "/blocks.16/self_attn/Concat_2_output_0", "/blocks.16/self_attn/Reshape_2_output_0", "Unsqueeze7263", "Unsqueeze7266", "StridedSlice7269", "Squeeze7270", "BinaryOp7271", "BinaryOp7272", "/Gather_33_output_0", "/blocks.16/self_attn/Reshape_7_output_0", "/blocks.16/self_attn/o_proj/FakeLinear_output_0", "/blocks.16/post_attention_layernorm/Cast_output_0", "/blocks.16/post_attention_layernorm/Mul_1_output_0", "/blocks.16/Add_output_0", "/blocks.16/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.16/mlp/gate_proj/FakeLinear_output_0", "/blocks.16/mlp/act_fn/Mul_output_0", "/blocks.16/mlp/act_fn/Mul_1_output_0", "/blocks.16/mlp/act_fn/Mul_2_output_0", "/blocks.16/mlp/act_fn/Add_output_0", "/blocks.16/mlp/act_fn/Mul_3_output_0", "/blocks.16/mlp/act_fn/Tanh_output_0", "/blocks.16/mlp/act_fn/Add_1_output_0", "/blocks.16/mlp/act_fn/Mul_4_output_0", "/blocks.16/mlp/act_fn/Mul_5_output_0", "/blocks.16/mlp/up_proj/FakeLinear_output_0", "/blocks.16/mlp/Mul_output_0", "/blocks.16/mlp/down_proj/FakeLinear_output_0", "/blocks.16/post_feedforward_layernorm/Cast_output_0", "/blocks.16/post_feedforward_layernorm/Mul_1_output_0", "/blocks.16/Add_1_output_0", "/blocks.17/Reshape_output_0", "/blocks.17/input_layernorm/Mul_1_output_0", "/blocks.17/self_attn/q_proj/FakeLinear_output_0", "/blocks.17/self_attn/Shape_output_0", "Shape7423", "Rank7425", "BinaryOp7427", "Unsqueeze7428", "BinaryOp7430", "Unsqueeze7431", "StridedSlice7434", "Squeeze7435", "BinaryOp7437", "/blocks.17/self_attn/Gather_output_0", "/blocks.17/self_attn/Unsqueeze_output_0", "Unsqueeze7445", "Unsqueeze7448", "StridedSlice7451", "Squeeze7452", "BinaryOp7453", "BinaryOp7454", "/blocks.17/self_attn/Gather_1_output_0", "/blocks.17/self_attn/Unsqueeze_1_output_0", "/blocks.17/self_attn/Concat_output_0", "/blocks.17/self_attn/Reshape_output_0", "/blocks.17/self_attn/q_norm/Cast_output_0", "/blocks.17/self_attn/q_norm/Mul_1_output_0", "/blocks.17/self_attn/Mul_output_0", "/blocks.17/self_attn/Shape_2_output_0", "Shape7572", "Rank7574", "BinaryOp7576", "Unsqueeze7577", "BinaryOp7579", "Unsqueeze7580", "StridedSlice7583", "Squeeze7584", "BinaryOp7585", "BinaryOp7586", "/blocks.17/self_attn/Gather_2_output_0", "/blocks.17/self_attn/Div_output_0", "/blocks.17/self_attn/Unsqueeze_7_output_0", "/blocks.17/self_attn/Slice_1_output_0", "/blocks.17/self_attn/Neg_output_0", "/blocks.17/self_attn/Unsqueeze_6_output_0", "/blocks.17/self_attn/Slice_output_0", "/blocks.17/self_attn/Concat_3_output_0", "/blocks.17/self_attn/Mul_1_output_0", "/blocks.17/self_attn/Add_output_0", "/blocks.17/self_attn/k_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_2_output_0", "/blocks.17/self_attn/Unsqueeze_3_output_0", "/blocks.17/self_attn/Concat_1_output_0", "/blocks.17/self_attn/Reshape_1_output_0", "/blocks.17/self_attn/k_norm/Cast_output_0", "/blocks.17/self_attn/k_norm/Mul_1_output_0", "/blocks.17/self_attn/Mul_2_output_0", "/blocks.17/self_attn/Shape_3_output_0", "Shape7470", "Rank7472", "BinaryOp7474", "Unsqueeze7475", "BinaryOp7477", "Unsqueeze7478", "StridedSlice7481", "Squeeze7482", "BinaryOp7483", "BinaryOp7484", "/blocks.17/self_attn/Gather_3_output_0", "/blocks.17/self_attn/Div_1_output_0", "/blocks.17/self_attn/Unsqueeze_9_output_0", "/blocks.17/self_attn/Slice_3_output_0", "/blocks.17/self_attn/Neg_1_output_0", "/blocks.17/self_attn/Unsqueeze_8_output_0", "/blocks.17/self_attn/Slice_2_output_0", "/blocks.17/self_attn/Concat_4_output_0", "/blocks.17/self_attn/Mul_3_output_0", "/blocks.17/self_attn/Add_1_output_0", "/blocks.17/self_attn/v_proj/FakeLinear_output_0", "/blocks.17/self_attn/Unsqueeze_4_output_0", "/blocks.17/self_attn/Unsqueeze_5_output_0", "/blocks.17/self_attn/Concat_2_output_0", "/blocks.17/self_attn/Reshape_2_output_0", "Unsqueeze7693", "Unsqueeze7696", "StridedSlice7699", "Squeeze7700", "BinaryOp7702", "/Gather_35_output_0", "/blocks.17/self_attn/Reshape_7_output_0", "/blocks.17/self_attn/o_proj/FakeLinear_output_0", "/blocks.17/post_attention_layernorm/Cast_output_0", "/blocks.17/post_attention_layernorm/Mul_1_output_0", "/blocks.17/Add_output_0", "/blocks.17/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.17/mlp/gate_proj/FakeLinear_output_0", "/blocks.17/mlp/act_fn/Mul_output_0", "/blocks.17/mlp/act_fn/Mul_1_output_0", "/blocks.17/mlp/act_fn/Mul_2_output_0", "/blocks.17/mlp/act_fn/Add_output_0", "/blocks.17/mlp/act_fn/Mul_3_output_0", "/blocks.17/mlp/act_fn/Tanh_output_0", "/blocks.17/mlp/act_fn/Add_1_output_0", "/blocks.17/mlp/act_fn/Mul_4_output_0", "/blocks.17/mlp/act_fn/Mul_5_output_0", "/blocks.17/mlp/up_proj/FakeLinear_output_0", "/blocks.17/mlp/Mul_output_0", "/blocks.17/mlp/down_proj/FakeLinear_output_0", "/blocks.17/post_feedforward_layernorm/Cast_output_0", "/blocks.17/post_feedforward_layernorm/Mul_1_output_0", "/blocks.17/Add_1_output_0", "/blocks.18/Reshape_output_0", "/blocks.18/input_layernorm/Mul_1_output_0", "/blocks.18/self_attn/q_proj/FakeLinear_output_0", "/blocks.18/self_attn/Shape_output_0", "Shape7853", "Rank7855", "BinaryOp7857", "Unsqueeze7858", "BinaryOp7860", "Unsqueeze7861", "StridedSlice7864", "Squeeze7865", "BinaryOp7867", "/blocks.18/self_attn/Gather_output_0", "/blocks.18/self_attn/Unsqueeze_output_0", "Unsqueeze7875", "Unsqueeze7878", "StridedSlice7881", "Squeeze7882", "BinaryOp7883", "BinaryOp7884", "/blocks.18/self_attn/Gather_1_output_0", "/blocks.18/self_attn/Unsqueeze_1_output_0", "/blocks.18/self_attn/Concat_output_0", "/blocks.18/self_attn/Reshape_output_0", "/blocks.18/self_attn/q_norm/Cast_output_0", "/blocks.18/self_attn/q_norm/Mul_1_output_0", "/blocks.18/self_attn/Mul_output_0", "/blocks.18/self_attn/Shape_2_output_0", "Shape8002", "Rank8004", "BinaryOp8006", "Unsqueeze8007", "BinaryOp8009", "Unsqueeze8010", "StridedSlice8013", "Squeeze8014", "BinaryOp8015", "BinaryOp8016", "/blocks.18/self_attn/Gather_2_output_0", "/blocks.18/self_attn/Div_output_0", "/blocks.18/self_attn/Unsqueeze_7_output_0", "/blocks.18/self_attn/Slice_1_output_0", "/blocks.18/self_attn/Neg_output_0", "/blocks.18/self_attn/Unsqueeze_6_output_0", "/blocks.18/self_attn/Slice_output_0", "/blocks.18/self_attn/Concat_3_output_0", "/blocks.18/self_attn/Mul_1_output_0", "/blocks.18/self_attn/Add_output_0", "/blocks.18/self_attn/k_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_2_output_0", "/blocks.18/self_attn/Unsqueeze_3_output_0", "/blocks.18/self_attn/Concat_1_output_0", "/blocks.18/self_attn/Reshape_1_output_0", "/blocks.18/self_attn/k_norm/Cast_output_0", "/blocks.18/self_attn/k_norm/Mul_1_output_0", "/blocks.18/self_attn/Mul_2_output_0", "/blocks.18/self_attn/Shape_3_output_0", "Shape7900", "Rank7902", "BinaryOp7904", "Unsqueeze7905", "BinaryOp7907", "Unsqueeze7908", "StridedSlice7911", "Squeeze7912", "BinaryOp7913", "BinaryOp7914", "/blocks.18/self_attn/Gather_3_output_0", "/blocks.18/self_attn/Div_1_output_0", "/blocks.18/self_attn/Unsqueeze_9_output_0", "/blocks.18/self_attn/Slice_3_output_0", "/blocks.18/self_attn/Neg_1_output_0", "/blocks.18/self_attn/Unsqueeze_8_output_0", "/blocks.18/self_attn/Slice_2_output_0", "/blocks.18/self_attn/Concat_4_output_0", "/blocks.18/self_attn/Mul_3_output_0", "/blocks.18/self_attn/Add_1_output_0", "/blocks.18/self_attn/v_proj/FakeLinear_output_0", "/blocks.18/self_attn/Unsqueeze_4_output_0", "/blocks.18/self_attn/Unsqueeze_5_output_0", "/blocks.18/self_attn/Concat_2_output_0", "/blocks.18/self_attn/Reshape_2_output_0", "Unsqueeze8123", "Unsqueeze8126", "StridedSlice8129", "Squeeze8130", "BinaryOp8131", "BinaryOp8132", "/Gather_37_output_0", "/blocks.18/self_attn/Reshape_7_output_0", "/blocks.18/self_attn/o_proj/FakeLinear_output_0", "/blocks.18/post_attention_layernorm/Cast_output_0", "/blocks.18/post_attention_layernorm/Mul_1_output_0", "/blocks.18/Add_output_0", "/blocks.18/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.18/mlp/gate_proj/FakeLinear_output_0", "/blocks.18/mlp/act_fn/Mul_output_0", "/blocks.18/mlp/act_fn/Mul_1_output_0", "/blocks.18/mlp/act_fn/Mul_2_output_0", "/blocks.18/mlp/act_fn/Add_output_0", "/blocks.18/mlp/act_fn/Mul_3_output_0", "/blocks.18/mlp/act_fn/Tanh_output_0", "/blocks.18/mlp/act_fn/Add_1_output_0", "/blocks.18/mlp/act_fn/Mul_4_output_0", "/blocks.18/mlp/act_fn/Mul_5_output_0", "/blocks.18/mlp/up_proj/FakeLinear_output_0", "/blocks.18/mlp/Mul_output_0", "/blocks.18/mlp/down_proj/FakeLinear_output_0", "/blocks.18/post_feedforward_layernorm/Cast_output_0", "/blocks.18/post_feedforward_layernorm/Mul_1_output_0", "/blocks.18/Add_1_output_0", "/blocks.19/Reshape_output_0", "/blocks.19/input_layernorm/Mul_1_output_0", "/blocks.19/self_attn/q_proj/FakeLinear_output_0", "/blocks.19/self_attn/Shape_output_0", "Shape8283", "Rank8285", "BinaryOp8287", "Unsqueeze8288", "BinaryOp8290", "Unsqueeze8291", "StridedSlice8294", "Squeeze8295", "BinaryOp8297", "/blocks.19/self_attn/Gather_output_0", "/blocks.19/self_attn/Unsqueeze_output_0", "Unsqueeze8305", "Unsqueeze8308", "StridedSlice8311", "Squeeze8312", "BinaryOp8313", "BinaryOp8314", "/blocks.19/self_attn/Gather_1_output_0", "/blocks.19/self_attn/Unsqueeze_1_output_0", "/blocks.19/self_attn/Concat_output_0", "/blocks.19/self_attn/Reshape_output_0", "/blocks.19/self_attn/q_norm/Cast_output_0", "/blocks.19/self_attn/q_norm/Mul_1_output_0", "/blocks.19/self_attn/Mul_output_0", "/blocks.19/self_attn/Shape_2_output_0", "Shape8432", "Rank8434", "BinaryOp8436", "Unsqueeze8437", "BinaryOp8439", "Unsqueeze8440", "StridedSlice8443", "Squeeze8444", "BinaryOp8445", "BinaryOp8446", "/blocks.19/self_attn/Gather_2_output_0", "/blocks.19/self_attn/Div_output_0", "/blocks.19/self_attn/Unsqueeze_7_output_0", "/blocks.19/self_attn/Slice_1_output_0", "/blocks.19/self_attn/Neg_output_0", "/blocks.19/self_attn/Unsqueeze_6_output_0", "/blocks.19/self_attn/Slice_output_0", "/blocks.19/self_attn/Concat_3_output_0", "/blocks.19/self_attn/Mul_1_output_0", "/blocks.19/self_attn/Add_output_0", "/blocks.19/self_attn/k_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_2_output_0", "/blocks.19/self_attn/Unsqueeze_3_output_0", "/blocks.19/self_attn/Concat_1_output_0", "/blocks.19/self_attn/Reshape_1_output_0", "/blocks.19/self_attn/k_norm/Cast_output_0", "/blocks.19/self_attn/k_norm/Mul_1_output_0", "/blocks.19/self_attn/Mul_2_output_0", "/blocks.19/self_attn/Shape_3_output_0", "Shape8330", "Rank8332", "BinaryOp8334", "Unsqueeze8335", "BinaryOp8337", "Unsqueeze8338", "StridedSlice8341", "Squeeze8342", "BinaryOp8343", "BinaryOp8344", "/blocks.19/self_attn/Gather_3_output_0", "/blocks.19/self_attn/Div_1_output_0", "/blocks.19/self_attn/Unsqueeze_9_output_0", "/blocks.19/self_attn/Slice_3_output_0", "/blocks.19/self_attn/Neg_1_output_0", "/blocks.19/self_attn/Unsqueeze_8_output_0", "/blocks.19/self_attn/Slice_2_output_0", "/blocks.19/self_attn/Concat_4_output_0", "/blocks.19/self_attn/Mul_3_output_0", "/blocks.19/self_attn/Add_1_output_0", "/blocks.19/self_attn/v_proj/FakeLinear_output_0", "/blocks.19/self_attn/Unsqueeze_4_output_0", "/blocks.19/self_attn/Unsqueeze_5_output_0", "/blocks.19/self_attn/Concat_2_output_0", "/blocks.19/self_attn/Reshape_2_output_0", "Unsqueeze8553", "Unsqueeze8556", "StridedSlice8559", "Squeeze8560", "BinaryOp8561", "BinaryOp8562", "/Gather_39_output_0", "/blocks.19/self_attn/Reshape_7_output_0", "/blocks.19/self_attn/o_proj/FakeLinear_output_0", "/blocks.19/post_attention_layernorm/Cast_output_0", "/blocks.19/post_attention_layernorm/Mul_1_output_0", "/blocks.19/Add_output_0", "/blocks.19/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.19/mlp/gate_proj/FakeLinear_output_0", "/blocks.19/mlp/act_fn/Mul_output_0", "/blocks.19/mlp/act_fn/Mul_1_output_0", "/blocks.19/mlp/act_fn/Mul_2_output_0", "/blocks.19/mlp/act_fn/Add_output_0", "/blocks.19/mlp/act_fn/Mul_3_output_0", "/blocks.19/mlp/act_fn/Tanh_output_0", "/blocks.19/mlp/act_fn/Add_1_output_0", "/blocks.19/mlp/act_fn/Mul_4_output_0", "/blocks.19/mlp/act_fn/Mul_5_output_0", "/blocks.19/mlp/up_proj/FakeLinear_output_0", "/blocks.19/mlp/Mul_output_0", "/blocks.19/mlp/down_proj/FakeLinear_output_0", "/blocks.19/post_feedforward_layernorm/Cast_output_0", "/blocks.19/post_feedforward_layernorm/Mul_1_output_0", "/blocks.19/Add_1_output_0", "/blocks.20/Reshape_output_0", "/blocks.20/input_layernorm/Mul_1_output_0", "/blocks.20/self_attn/q_proj/FakeLinear_output_0", "/blocks.20/self_attn/Shape_output_0", "Shape8713", "Rank8715", "BinaryOp8717", "Unsqueeze8718", "BinaryOp8720", "Unsqueeze8721", "StridedSlice8724", "Squeeze8725", "BinaryOp8727", "/blocks.20/self_attn/Gather_output_0", "/blocks.20/self_attn/Unsqueeze_output_0", "Unsqueeze8735", "Unsqueeze8738", "StridedSlice8741", "Squeeze8742", "BinaryOp8743", "BinaryOp8744", "/blocks.20/self_attn/Gather_1_output_0", "/blocks.20/self_attn/Unsqueeze_1_output_0", "/blocks.20/self_attn/Concat_output_0", "/blocks.20/self_attn/Reshape_output_0", "/blocks.20/self_attn/q_norm/Cast_output_0", "/blocks.20/self_attn/q_norm/Mul_1_output_0", "/blocks.20/self_attn/Mul_output_0", "/blocks.20/self_attn/Shape_2_output_0", "Shape8862", "Rank8864", "BinaryOp8866", "Unsqueeze8867", "BinaryOp8869", "Unsqueeze8870", "StridedSlice8873", "Squeeze8874", "BinaryOp8875", "BinaryOp8876", "/blocks.20/self_attn/Gather_2_output_0", "/blocks.20/self_attn/Div_output_0", "/blocks.20/self_attn/Unsqueeze_7_output_0", "/blocks.20/self_attn/Slice_1_output_0", "/blocks.20/self_attn/Neg_output_0", "/blocks.20/self_attn/Unsqueeze_6_output_0", "/blocks.20/self_attn/Slice_output_0", "/blocks.20/self_attn/Concat_3_output_0", "/blocks.20/self_attn/Mul_1_output_0", "/blocks.20/self_attn/Add_output_0", "/blocks.20/self_attn/k_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_2_output_0", "/blocks.20/self_attn/Unsqueeze_3_output_0", "/blocks.20/self_attn/Concat_1_output_0", "/blocks.20/self_attn/Reshape_1_output_0", "/blocks.20/self_attn/k_norm/Cast_output_0", "/blocks.20/self_attn/k_norm/Mul_1_output_0", "/blocks.20/self_attn/Mul_2_output_0", "/blocks.20/self_attn/Shape_3_output_0", "Shape8760", "Rank8762", "BinaryOp8764", "Unsqueeze8765", "BinaryOp8767", "Unsqueeze8768", "StridedSlice8771", "Squeeze8772", "BinaryOp8773", "BinaryOp8774", "/blocks.20/self_attn/Gather_3_output_0", "/blocks.20/self_attn/Div_1_output_0", "/blocks.20/self_attn/Unsqueeze_9_output_0", "/blocks.20/self_attn/Slice_3_output_0", "/blocks.20/self_attn/Neg_1_output_0", "/blocks.20/self_attn/Unsqueeze_8_output_0", "/blocks.20/self_attn/Slice_2_output_0", "/blocks.20/self_attn/Concat_4_output_0", "/blocks.20/self_attn/Mul_3_output_0", "/blocks.20/self_attn/Add_1_output_0", "/blocks.20/self_attn/v_proj/FakeLinear_output_0", "/blocks.20/self_attn/Unsqueeze_4_output_0", "/blocks.20/self_attn/Unsqueeze_5_output_0", "/blocks.20/self_attn/Concat_2_output_0", "/blocks.20/self_attn/Reshape_2_output_0", "Unsqueeze8983", "Unsqueeze8986", "StridedSlice8989", "Squeeze8990", "BinaryOp8991", "BinaryOp8992", "/Gather_41_output_0", "/blocks.20/self_attn/Reshape_7_output_0", "/blocks.20/self_attn/o_proj/FakeLinear_output_0", "/blocks.20/post_attention_layernorm/Cast_output_0", "/blocks.20/post_attention_layernorm/Mul_1_output_0", "/blocks.20/Add_output_0", "/blocks.20/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.20/mlp/gate_proj/FakeLinear_output_0", "/blocks.20/mlp/act_fn/Mul_output_0", "/blocks.20/mlp/act_fn/Mul_1_output_0", "/blocks.20/mlp/act_fn/Mul_2_output_0", "/blocks.20/mlp/act_fn/Add_output_0", "/blocks.20/mlp/act_fn/Mul_3_output_0", "/blocks.20/mlp/act_fn/Tanh_output_0", "/blocks.20/mlp/act_fn/Add_1_output_0", "/blocks.20/mlp/act_fn/Mul_4_output_0", "/blocks.20/mlp/act_fn/Mul_5_output_0", "/blocks.20/mlp/up_proj/FakeLinear_output_0", "/blocks.20/mlp/Mul_output_0", "/blocks.20/mlp/down_proj/FakeLinear_output_0", "/blocks.20/post_feedforward_layernorm/Cast_output_0", "/blocks.20/post_feedforward_layernorm/Mul_1_output_0", "/blocks.20/Add_1_output_0", "/blocks.21/Reshape_output_0", "/blocks.21/input_layernorm/Mul_1_output_0", "/blocks.21/self_attn/q_proj/FakeLinear_output_0", "/blocks.21/self_attn/Shape_output_0", "Shape9143", "Rank9145", "BinaryOp9147", "Unsqueeze9148", "BinaryOp9150", "Unsqueeze9151", "StridedSlice9154", "Squeeze9155", "BinaryOp9157", "/blocks.21/self_attn/Gather_output_0", "/blocks.21/self_attn/Unsqueeze_output_0", "Unsqueeze9165", "Unsqueeze9168", "StridedSlice9171", "Squeeze9172", "BinaryOp9173", "BinaryOp9174", "/blocks.21/self_attn/Gather_1_output_0", "/blocks.21/self_attn/Unsqueeze_1_output_0", "/blocks.21/self_attn/Concat_output_0", "/blocks.21/self_attn/Reshape_output_0", "/blocks.21/self_attn/q_norm/Cast_output_0", "/blocks.21/self_attn/q_norm/Mul_1_output_0", "/blocks.21/self_attn/Mul_output_0", "/blocks.21/self_attn/Shape_2_output_0", "Shape9292", "Rank9294", "BinaryOp9296", "Unsqueeze9297", "BinaryOp9299", "Unsqueeze9300", "StridedSlice9303", "Squeeze9304", "BinaryOp9305", "BinaryOp9306", "/blocks.21/self_attn/Gather_2_output_0", "/blocks.21/self_attn/Div_output_0", "/blocks.21/self_attn/Unsqueeze_7_output_0", "/blocks.21/self_attn/Slice_1_output_0", "/blocks.21/self_attn/Neg_output_0", "/blocks.21/self_attn/Unsqueeze_6_output_0", "/blocks.21/self_attn/Slice_output_0", "/blocks.21/self_attn/Concat_3_output_0", "/blocks.21/self_attn/Mul_1_output_0", "/blocks.21/self_attn/Add_output_0", "/blocks.21/self_attn/k_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_2_output_0", "/blocks.21/self_attn/Unsqueeze_3_output_0", "/blocks.21/self_attn/Concat_1_output_0", "/blocks.21/self_attn/Reshape_1_output_0", "/blocks.21/self_attn/k_norm/Cast_output_0", "/blocks.21/self_attn/k_norm/Mul_1_output_0", "/blocks.21/self_attn/Mul_2_output_0", "/blocks.21/self_attn/Shape_3_output_0", "Shape9190", "Rank9192", "BinaryOp9194", "Unsqueeze9195", "BinaryOp9197", "Unsqueeze9198", "StridedSlice9201", "Squeeze9202", "BinaryOp9203", "BinaryOp9204", "/blocks.21/self_attn/Gather_3_output_0", "/blocks.21/self_attn/Div_1_output_0", "/blocks.21/self_attn/Unsqueeze_9_output_0", "/blocks.21/self_attn/Slice_3_output_0", "/blocks.21/self_attn/Neg_1_output_0", "/blocks.21/self_attn/Unsqueeze_8_output_0", "/blocks.21/self_attn/Slice_2_output_0", "/blocks.21/self_attn/Concat_4_output_0", "/blocks.21/self_attn/Mul_3_output_0", "/blocks.21/self_attn/Add_1_output_0", "/blocks.21/self_attn/v_proj/FakeLinear_output_0", "/blocks.21/self_attn/Unsqueeze_4_output_0", "/blocks.21/self_attn/Unsqueeze_5_output_0", "/blocks.21/self_attn/Concat_2_output_0", "/blocks.21/self_attn/Reshape_2_output_0", "Unsqueeze9413", "Unsqueeze9416", "StridedSlice9419", "Squeeze9420", "BinaryOp9421", "BinaryOp9422", "/Gather_43_output_0", "/blocks.21/self_attn/Reshape_7_output_0", "/blocks.21/self_attn/o_proj/FakeLinear_output_0", "/blocks.21/post_attention_layernorm/Cast_output_0", "/blocks.21/post_attention_layernorm/Mul_1_output_0", "/blocks.21/Add_output_0", "/blocks.21/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.21/mlp/gate_proj/FakeLinear_output_0", "/blocks.21/mlp/act_fn/Mul_output_0", "/blocks.21/mlp/act_fn/Mul_1_output_0", "/blocks.21/mlp/act_fn/Mul_2_output_0", "/blocks.21/mlp/act_fn/Add_output_0", "/blocks.21/mlp/act_fn/Mul_3_output_0", "/blocks.21/mlp/act_fn/Tanh_output_0", "/blocks.21/mlp/act_fn/Add_1_output_0", "/blocks.21/mlp/act_fn/Mul_4_output_0", "/blocks.21/mlp/act_fn/Mul_5_output_0", "/blocks.21/mlp/up_proj/FakeLinear_output_0", "/blocks.21/mlp/Mul_output_0", "/blocks.21/mlp/down_proj/FakeLinear_output_0", "/blocks.21/post_feedforward_layernorm/Cast_output_0", "/blocks.21/post_feedforward_layernorm/Mul_1_output_0", "/blocks.21/Add_1_output_0", "/blocks.22/Reshape_output_0", "/blocks.22/input_layernorm/Mul_1_output_0", "/blocks.22/self_attn/q_proj/FakeLinear_output_0", "/blocks.22/self_attn/Shape_output_0", "Shape9573", "Rank9575", "BinaryOp9577", "Unsqueeze9578", "BinaryOp9580", "Unsqueeze9581", "StridedSlice9584", "Squeeze9585", "BinaryOp9587", "/blocks.22/self_attn/Gather_output_0", "/blocks.22/self_attn/Unsqueeze_output_0", "Unsqueeze9595", "Unsqueeze9598", "StridedSlice9601", "Squeeze9602", "BinaryOp9603", "BinaryOp9604", "/blocks.22/self_attn/Gather_1_output_0", "/blocks.22/self_attn/Unsqueeze_1_output_0", "/blocks.22/self_attn/Concat_output_0", "/blocks.22/self_attn/Reshape_output_0", "/blocks.22/self_attn/q_norm/Cast_output_0", "/blocks.22/self_attn/q_norm/Mul_1_output_0", "/blocks.22/self_attn/Mul_output_0", "/blocks.22/self_attn/Shape_2_output_0", "Shape9722", "Rank9724", "BinaryOp9726", "Unsqueeze9727", "BinaryOp9729", "Unsqueeze9730", "StridedSlice9733", "Squeeze9734", "BinaryOp9735", "BinaryOp9736", "/blocks.22/self_attn/Gather_2_output_0", "/blocks.22/self_attn/Div_output_0", "/blocks.22/self_attn/Unsqueeze_7_output_0", "/blocks.22/self_attn/Slice_1_output_0", "/blocks.22/self_attn/Neg_output_0", "/blocks.22/self_attn/Unsqueeze_6_output_0", "/blocks.22/self_attn/Slice_output_0", "/blocks.22/self_attn/Concat_3_output_0", "/blocks.22/self_attn/Mul_1_output_0", "/blocks.22/self_attn/Add_output_0", "/blocks.22/self_attn/k_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_2_output_0", "/blocks.22/self_attn/Unsqueeze_3_output_0", "/blocks.22/self_attn/Concat_1_output_0", "/blocks.22/self_attn/Reshape_1_output_0", "/blocks.22/self_attn/k_norm/Cast_output_0", "/blocks.22/self_attn/k_norm/Mul_1_output_0", "/blocks.22/self_attn/Mul_2_output_0", "/blocks.22/self_attn/Shape_3_output_0", "Shape9620", "Rank9622", "BinaryOp9624", "Unsqueeze9625", "BinaryOp9627", "Unsqueeze9628", "StridedSlice9631", "Squeeze9632", "BinaryOp9633", "BinaryOp9634", "/blocks.22/self_attn/Gather_3_output_0", "/blocks.22/self_attn/Div_1_output_0", "/blocks.22/self_attn/Unsqueeze_9_output_0", "/blocks.22/self_attn/Slice_3_output_0", "/blocks.22/self_attn/Neg_1_output_0", "/blocks.22/self_attn/Unsqueeze_8_output_0", "/blocks.22/self_attn/Slice_2_output_0", "/blocks.22/self_attn/Concat_4_output_0", "/blocks.22/self_attn/Mul_3_output_0", "/blocks.22/self_attn/Add_1_output_0", "/blocks.22/self_attn/v_proj/FakeLinear_output_0", "/blocks.22/self_attn/Unsqueeze_4_output_0", "/blocks.22/self_attn/Unsqueeze_5_output_0", "/blocks.22/self_attn/Concat_2_output_0", "/blocks.22/self_attn/Reshape_2_output_0", "Unsqueeze9843", "Unsqueeze9846", "StridedSlice9849", "Squeeze9850", "BinaryOp9851", "BinaryOp9852", "/Gather_45_output_0", "/blocks.22/self_attn/Reshape_7_output_0", "/blocks.22/self_attn/o_proj/FakeLinear_output_0", "/blocks.22/post_attention_layernorm/Cast_output_0", "/blocks.22/post_attention_layernorm/Mul_1_output_0", "/blocks.22/Add_output_0", "/blocks.22/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.22/mlp/gate_proj/FakeLinear_output_0", "/blocks.22/mlp/act_fn/Mul_output_0", "/blocks.22/mlp/act_fn/Mul_1_output_0", "/blocks.22/mlp/act_fn/Mul_2_output_0", "/blocks.22/mlp/act_fn/Add_output_0", "/blocks.22/mlp/act_fn/Mul_3_output_0", "/blocks.22/mlp/act_fn/Tanh_output_0", "/blocks.22/mlp/act_fn/Add_1_output_0", "/blocks.22/mlp/act_fn/Mul_4_output_0", "/blocks.22/mlp/act_fn/Mul_5_output_0", "/blocks.22/mlp/up_proj/FakeLinear_output_0", "/blocks.22/mlp/Mul_output_0", "/blocks.22/mlp/down_proj/FakeLinear_output_0", "/blocks.22/post_feedforward_layernorm/Cast_output_0", "/blocks.22/post_feedforward_layernorm/Mul_1_output_0", "/blocks.22/Add_1_output_0", "/blocks.23/Reshape_output_0", "/blocks.23/input_layernorm/Mul_1_output_0", "/blocks.23/self_attn/q_proj/FakeLinear_output_0", "/blocks.23/self_attn/Shape_output_0", "Shape10003", "Rank10005", "BinaryOp10007", "Unsqueeze10008", "BinaryOp10010", "Unsqueeze10011", "StridedSlice10014", "Squeeze10015", "BinaryOp10017", "/blocks.23/self_attn/Gather_output_0", "/blocks.23/self_attn/Unsqueeze_output_0", "Unsqueeze10025", "Unsqueeze10028", "StridedSlice10031", "Squeeze10032", "BinaryOp10033", "BinaryOp10034", "/blocks.23/self_attn/Gather_1_output_0", "/blocks.23/self_attn/Unsqueeze_1_output_0", "/blocks.23/self_attn/Concat_output_0", "/blocks.23/self_attn/Reshape_output_0", "/blocks.23/self_attn/q_norm/Cast_output_0", "/blocks.23/self_attn/q_norm/Mul_1_output_0", "/blocks.23/self_attn/Mul_output_0", "/blocks.23/self_attn/Shape_2_output_0", "Shape10152", "Rank10154", "BinaryOp10156", "Unsqueeze10157", "BinaryOp10159", "Unsqueeze10160", "StridedSlice10163", "Squeeze10164", "BinaryOp10165", "BinaryOp10166", "/blocks.23/self_attn/Gather_2_output_0", "/blocks.23/self_attn/Div_output_0", "/blocks.23/self_attn/Unsqueeze_7_output_0", "/blocks.23/self_attn/Slice_1_output_0", "/blocks.23/self_attn/Neg_output_0", "/blocks.23/self_attn/Unsqueeze_6_output_0", "/blocks.23/self_attn/Slice_output_0", "/blocks.23/self_attn/Concat_3_output_0", "/blocks.23/self_attn/Mul_1_output_0", "/blocks.23/self_attn/Add_output_0", "/blocks.23/self_attn/k_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_2_output_0", "/blocks.23/self_attn/Unsqueeze_3_output_0", "/blocks.23/self_attn/Concat_1_output_0", "/blocks.23/self_attn/Reshape_1_output_0", "/blocks.23/self_attn/k_norm/Cast_output_0", "/blocks.23/self_attn/k_norm/Mul_1_output_0", "/blocks.23/self_attn/Mul_2_output_0", "/blocks.23/self_attn/Shape_3_output_0", "Shape10050", "Rank10052", "BinaryOp10054", "Unsqueeze10055", "BinaryOp10057", "Unsqueeze10058", "StridedSlice10061", "Squeeze10062", "BinaryOp10063", "BinaryOp10064", "/blocks.23/self_attn/Gather_3_output_0", "/blocks.23/self_attn/Div_1_output_0", "/blocks.23/self_attn/Unsqueeze_9_output_0", "/blocks.23/self_attn/Slice_3_output_0", "/blocks.23/self_attn/Neg_1_output_0", "/blocks.23/self_attn/Unsqueeze_8_output_0", "/blocks.23/self_attn/Slice_2_output_0", "/blocks.23/self_attn/Concat_4_output_0", "/blocks.23/self_attn/Mul_3_output_0", "/blocks.23/self_attn/Add_1_output_0", "/blocks.23/self_attn/v_proj/FakeLinear_output_0", "/blocks.23/self_attn/Unsqueeze_4_output_0", "/blocks.23/self_attn/Unsqueeze_5_output_0", "/blocks.23/self_attn/Concat_2_output_0", "/blocks.23/self_attn/Reshape_2_output_0", "Unsqueeze10273", "Unsqueeze10276", "StridedSlice10279", "Squeeze10280", "BinaryOp10282", "/Gather_47_output_0", "/blocks.23/self_attn/Reshape_7_output_0", "/blocks.23/self_attn/o_proj/FakeLinear_output_0", "/blocks.23/post_attention_layernorm/Cast_output_0", "/blocks.23/post_attention_layernorm/Mul_1_output_0", "/blocks.23/Add_output_0", "/blocks.23/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.23/mlp/gate_proj/FakeLinear_output_0", "/blocks.23/mlp/act_fn/Mul_output_0", "/blocks.23/mlp/act_fn/Mul_1_output_0", "/blocks.23/mlp/act_fn/Mul_2_output_0", "/blocks.23/mlp/act_fn/Add_output_0", "/blocks.23/mlp/act_fn/Mul_3_output_0", "/blocks.23/mlp/act_fn/Tanh_output_0", "/blocks.23/mlp/act_fn/Add_1_output_0", "/blocks.23/mlp/act_fn/Mul_4_output_0", "/blocks.23/mlp/act_fn/Mul_5_output_0", "/blocks.23/mlp/up_proj/FakeLinear_output_0", "/blocks.23/mlp/Mul_output_0", "/blocks.23/mlp/down_proj/FakeLinear_output_0", "/blocks.23/post_feedforward_layernorm/Cast_output_0", "/blocks.23/post_feedforward_layernorm/Mul_1_output_0", "/blocks.23/Add_1_output_0", "/blocks.24/Reshape_output_0", "/blocks.24/input_layernorm/Mul_1_output_0", "/blocks.24/self_attn/q_proj/FakeLinear_output_0", "/blocks.24/self_attn/Shape_output_0", "Shape10433", "Rank10435", "BinaryOp10437", "Unsqueeze10438", "BinaryOp10440", "Unsqueeze10441", "StridedSlice10444", "Squeeze10445", "BinaryOp10447", "/blocks.24/self_attn/Gather_output_0", "/blocks.24/self_attn/Unsqueeze_output_0", "Unsqueeze10455", "Unsqueeze10458", "StridedSlice10461", "Squeeze10462", "BinaryOp10463", "BinaryOp10464", "/blocks.24/self_attn/Gather_1_output_0", "/blocks.24/self_attn/Unsqueeze_1_output_0", "/blocks.24/self_attn/Concat_output_0", "/blocks.24/self_attn/Reshape_output_0", "/blocks.24/self_attn/q_norm/Cast_output_0", "/blocks.24/self_attn/q_norm/Mul_1_output_0", "/blocks.24/self_attn/Mul_output_0", "/blocks.24/self_attn/Shape_2_output_0", "Shape10582", "Rank10584", "BinaryOp10586", "Unsqueeze10587", "BinaryOp10589", "Unsqueeze10590", "StridedSlice10593", "Squeeze10594", "BinaryOp10595", "BinaryOp10596", "/blocks.24/self_attn/Gather_2_output_0", "/blocks.24/self_attn/Div_output_0", "/blocks.24/self_attn/Unsqueeze_7_output_0", "/blocks.24/self_attn/Slice_1_output_0", "/blocks.24/self_attn/Neg_output_0", "/blocks.24/self_attn/Unsqueeze_6_output_0", "/blocks.24/self_attn/Slice_output_0", "/blocks.24/self_attn/Concat_3_output_0", "/blocks.24/self_attn/Mul_1_output_0", "/blocks.24/self_attn/Add_output_0", "/blocks.24/self_attn/k_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_2_output_0", "/blocks.24/self_attn/Unsqueeze_3_output_0", "/blocks.24/self_attn/Concat_1_output_0", "/blocks.24/self_attn/Reshape_1_output_0", "/blocks.24/self_attn/k_norm/Cast_output_0", "/blocks.24/self_attn/k_norm/Mul_1_output_0", "/blocks.24/self_attn/Mul_2_output_0", "/blocks.24/self_attn/Shape_3_output_0", "Shape10480", "Rank10482", "BinaryOp10484", "Unsqueeze10485", "BinaryOp10487", "Unsqueeze10488", "StridedSlice10491", "Squeeze10492", "BinaryOp10493", "BinaryOp10494", "/blocks.24/self_attn/Gather_3_output_0", "/blocks.24/self_attn/Div_1_output_0", "/blocks.24/self_attn/Unsqueeze_9_output_0", "/blocks.24/self_attn/Slice_3_output_0", "/blocks.24/self_attn/Neg_1_output_0", "/blocks.24/self_attn/Unsqueeze_8_output_0", "/blocks.24/self_attn/Slice_2_output_0", "/blocks.24/self_attn/Concat_4_output_0", "/blocks.24/self_attn/Mul_3_output_0", "/blocks.24/self_attn/Add_1_output_0", "/blocks.24/self_attn/v_proj/FakeLinear_output_0", "/blocks.24/self_attn/Unsqueeze_4_output_0", "/blocks.24/self_attn/Unsqueeze_5_output_0", "/blocks.24/self_attn/Concat_2_output_0", "/blocks.24/self_attn/Reshape_2_output_0", "Unsqueeze10703", "Unsqueeze10706", "StridedSlice10709", "Squeeze10710", "BinaryOp10711", "BinaryOp10712", "/Gather_49_output_0", "/blocks.24/self_attn/Reshape_7_output_0", "/blocks.24/self_attn/o_proj/FakeLinear_output_0", "/blocks.24/post_attention_layernorm/Cast_output_0", "/blocks.24/post_attention_layernorm/Mul_1_output_0", "/blocks.24/Add_output_0", "/blocks.24/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.24/mlp/gate_proj/FakeLinear_output_0", "/blocks.24/mlp/act_fn/Mul_output_0", "/blocks.24/mlp/act_fn/Mul_1_output_0", "/blocks.24/mlp/act_fn/Mul_2_output_0", "/blocks.24/mlp/act_fn/Add_output_0", "/blocks.24/mlp/act_fn/Mul_3_output_0", "/blocks.24/mlp/act_fn/Tanh_output_0", "/blocks.24/mlp/act_fn/Add_1_output_0", "/blocks.24/mlp/act_fn/Mul_4_output_0", "/blocks.24/mlp/act_fn/Mul_5_output_0", "/blocks.24/mlp/up_proj/FakeLinear_output_0", "/blocks.24/mlp/Mul_output_0", "/blocks.24/mlp/down_proj/FakeLinear_output_0", "/blocks.24/post_feedforward_layernorm/Cast_output_0", "/blocks.24/post_feedforward_layernorm/Mul_1_output_0", "/blocks.24/Add_1_output_0", "/blocks.25/Reshape_output_0", "/blocks.25/input_layernorm/Mul_1_output_0", "/blocks.25/self_attn/q_proj/FakeLinear_output_0", "/blocks.25/self_attn/Shape_output_0", "Shape10863", "Rank10865", "BinaryOp10867", "Unsqueeze10868", "BinaryOp10870", "Unsqueeze10871", "StridedSlice10874", "Squeeze10875", "BinaryOp10877", "/blocks.25/self_attn/Gather_output_0", "/blocks.25/self_attn/Unsqueeze_output_0", "Unsqueeze10885", "Unsqueeze10888", "StridedSlice10891", "Squeeze10892", "BinaryOp10893", "BinaryOp10894", "/blocks.25/self_attn/Gather_1_output_0", "/blocks.25/self_attn/Unsqueeze_1_output_0", "/blocks.25/self_attn/Concat_output_0", "/blocks.25/self_attn/Reshape_output_0", "/blocks.25/self_attn/q_norm/Cast_output_0", "/blocks.25/self_attn/q_norm/Mul_1_output_0", "/blocks.25/self_attn/Mul_output_0", "/blocks.25/self_attn/Shape_2_output_0", "Shape10981", "Rank10983", "BinaryOp10985", "Unsqueeze10986", "BinaryOp10988", "Unsqueeze10989", "StridedSlice10992", "Squeeze10993", "BinaryOp10994", "BinaryOp10995", "/blocks.25/self_attn/Gather_2_output_0", "/blocks.25/self_attn/Div_output_0", "/blocks.25/self_attn/Unsqueeze_7_output_0", "/blocks.25/self_attn/Slice_1_output_0", "/blocks.25/self_attn/Neg_output_0", "/blocks.25/self_attn/Unsqueeze_6_output_0", "/blocks.25/self_attn/Slice_output_0", "/blocks.25/self_attn/Concat_3_output_0", "/blocks.25/self_attn/Mul_1_output_0", "/blocks.25/self_attn/Add_output_0", "/blocks.25/self_attn/k_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_2_output_0", "/blocks.25/self_attn/Unsqueeze_3_output_0", "/blocks.25/self_attn/Concat_1_output_0", "/blocks.25/self_attn/Reshape_1_output_0", "/blocks.25/self_attn/k_norm/Cast_output_0", "/blocks.25/self_attn/k_norm/Mul_1_output_0", "/blocks.25/self_attn/Mul_2_output_0", "/blocks.25/self_attn/Shape_3_output_0", "Shape10910", "Rank10912", "BinaryOp10914", "Unsqueeze10915", "BinaryOp10917", "Unsqueeze10918", "StridedSlice10921", "Squeeze10922", "BinaryOp10923", "BinaryOp10924", "/blocks.25/self_attn/Gather_3_output_0", "/blocks.25/self_attn/Div_1_output_0", "/blocks.25/self_attn/Unsqueeze_9_output_0", "/blocks.25/self_attn/Slice_3_output_0", "/blocks.25/self_attn/Neg_1_output_0", "/blocks.25/self_attn/Unsqueeze_8_output_0", "/blocks.25/self_attn/Slice_2_output_0", "/blocks.25/self_attn/Concat_4_output_0", "/blocks.25/self_attn/Mul_3_output_0", "/blocks.25/self_attn/Add_1_output_0", "/blocks.25/self_attn/v_proj/FakeLinear_output_0", "/blocks.25/self_attn/Unsqueeze_4_output_0", "/blocks.25/self_attn/Unsqueeze_5_output_0", "/blocks.25/self_attn/Concat_2_output_0", "/blocks.25/self_attn/Reshape_2_output_0", "Unsqueeze11102", "Unsqueeze11105", "StridedSlice11108", "Squeeze11109", "BinaryOp11110", "BinaryOp11111", "/Gather_51_output_0", "/blocks.25/self_attn/Reshape_7_output_0", "/blocks.25/self_attn/o_proj/FakeLinear_output_0", "/blocks.25/post_attention_layernorm/Cast_output_0", "/blocks.25/post_attention_layernorm/Mul_1_output_0", "/blocks.25/Add_output_0", "/blocks.25/pre_feedforward_layernorm/Mul_1_output_0", "/blocks.25/mlp/gate_proj/FakeLinear_output_0", "/blocks.25/mlp/act_fn/Mul_output_0", "/blocks.25/mlp/act_fn/Mul_1_output_0", "/blocks.25/mlp/act_fn/Mul_2_output_0", "/blocks.25/mlp/act_fn/Add_output_0", "/blocks.25/mlp/act_fn/Mul_3_output_0", "/blocks.25/mlp/act_fn/Tanh_output_0", "/blocks.25/mlp/act_fn/Add_1_output_0", "/blocks.25/mlp/act_fn/Mul_4_output_0", "/blocks.25/mlp/act_fn/Mul_5_output_0", "/blocks.25/mlp/up_proj/FakeLinear_output_0", "/blocks.25/mlp/Mul_output_0", "/blocks.25/mlp/down_proj/FakeLinear_output_0", "/blocks.25/post_feedforward_layernorm/Cast_output_0", "/blocks.25/post_feedforward_layernorm/Mul_1_output_0", "/blocks.25/Add_1_output_0", "/Slice_output_0", "hidden_states", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] +, "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "15da5220-beac-4a08-850d-136e489a5b7f" }