{ "oplists": [ { "type": "Input", "name": "input_ids", "outputIndexes": [ 2 ] , "main_type": "Input", "main": { "dims": [ 1, 1, 576 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Input", "name": "attention_mask", "outputIndexes": [ 124 ] , "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Input", "name": "position_ids", "outputIndexes": [ 34 ] , "main_type": "Input", "main": { "dims": [ 1, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Input", "name": "past_key_values", "outputIndexes": [ 0 ] , "main_type": "Input", "main": { "dims": [ 30, 2, 1, -1, 3, 64 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Input", "name": "logits_index", "outputIndexes": [ 2716 ] , "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "presents", "inputIndexes": [ 0 ] , "outputIndexes": [ 1 ] , "main_type": "Reshape", "main": { "dims": [ -1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/Constant_output_0", "outputIndexes": [ 3 ] , "main_type": "Blob", "main": { "dims": [ 3 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 1, -1, 576 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_output_0", "inputIndexes": [ 2, 3 ] , "outputIndexes": [ 4 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm/Mul_1_output_0", "inputIndexes": [ 4 ] , "outputIndexes": [ 5 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 0, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 5 ] , "outputIndexes": [ 2720 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2720 ] , "outputIndexes": [ 2721 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/self_attn/q_proj/Linear", "inputIndexes": [ 2721 ] , "outputIndexes": [ 2722 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4608, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2722 ] , "outputIndexes": [ 2723 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2723 ] , "outputIndexes": [ 6 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_output_0", "inputIndexes": [ 5 ] , "outputIndexes": [ 7 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape51", "inputIndexes": [ 7 ] , "outputIndexes": [ 8 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank53", "inputIndexes": [ 7 ] , "outputIndexes": [ 9 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp55", "inputIndexes": [ 9, 9 ] , "outputIndexes": [ 10 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze56", "inputIndexes": [ 10 ] , "outputIndexes": [ 11 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "Const9", "outputIndexes": [ 12 ] , "main_type": "Blob", "main": { "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 1 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp58", "inputIndexes": [ 10, 12 ] , "outputIndexes": [ 13 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze59", "inputIndexes": [ 13 ] , "outputIndexes": [ 14 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "Unsqueeze61", "outputIndexes": [ 15 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 1 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice62", "inputIndexes": [ 8, 11, 14, 15 ] , "outputIndexes": [ 16 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze63", "inputIndexes": [ 16 ] , "outputIndexes": [ 17 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp65", "inputIndexes": [ 17, 17 ] , "outputIndexes": [ 18 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_1_output_0", "inputIndexes": [ 7, 18, 10 ] , "outputIndexes": [ 19 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/rotary/Constant_4_output_0", "outputIndexes": [ 20 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_output_0", "inputIndexes": [ 19, 20 ] , "outputIndexes": [ 21 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze75", "inputIndexes": [ 10 ] , "outputIndexes": [ 22 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze78", "inputIndexes": [ 13 ] , "outputIndexes": [ 23 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice81", "inputIndexes": [ 8, 22, 23, 15 ] , "outputIndexes": [ 24 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze82", "inputIndexes": [ 24 ] , "outputIndexes": [ 25 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp83", "inputIndexes": [ 12, 25 ] , "outputIndexes": [ 26 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp84", "inputIndexes": [ 26, 25 ] , "outputIndexes": [ 27 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_2_output_0", "inputIndexes": [ 7, 27, 10 ] , "outputIndexes": [ 28 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_1_output_0", "inputIndexes": [ 28, 20 ] , "outputIndexes": [ 29 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/Constant_4_output_0", "outputIndexes": [ 30 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 9 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/Constant_5_output_0", "outputIndexes": [ 31 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 64 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_output_0", "inputIndexes": [ 21, 29, 30, 31 ] , "outputIndexes": [ 32 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_1_output_0", "inputIndexes": [ 6, 32 ] , "outputIndexes": [ 33 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Cast", "name": "/rotary/Cast_output_0", "inputIndexes": [ 34 ] , "outputIndexes": [ 35 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 36 ] , "main_type": "Blob", "main": { "dims": [ 2 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ -1, 1 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/rotary/Reshape_output_0", "inputIndexes": [ 35, 36 ] , "outputIndexes": [ 37 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/rotary/Constant_2_output_0", "outputIndexes": [ 38 ] , "main_type": "Blob", "main": { "dims": [ 32 ] , "dataType": "DT_FLOAT", "dataFormat": "NCHW", "float32s": [ 1.0, 0.697831, 0.486968, 0.339821, 0.237137, 0.165482, 0.115478, 0.080584, 0.056234, 0.039242, 0.027384, 0.01911, 0.013335, 0.009306, 0.006494, 0.004532, 0.003162, 0.002207, 0.00154, 0.001075, 0.00075, 0.000523, 0.000365, 0.000255, 0.000178, 0.000124, 0.000087, 0.00006, 0.000042, 0.000029, 0.000021, 0.000014 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/rotary/Mul_output_0", "inputIndexes": [ 37, 38 ] , "outputIndexes": [ 39 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/rotary/Cos_output_0", "inputIndexes": [ 39 ] , "outputIndexes": [ 40 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/rotary/Unsqueeze_output_0", "inputIndexes": [ 40, 20 ] , "outputIndexes": [ 41 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/rotary/Sin_output_0", "inputIndexes": [ 39 ] , "outputIndexes": [ 42 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/rotary/Unsqueeze_1_output_0", "inputIndexes": [ 42, 20 ] , "outputIndexes": [ 43 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/rotary/Concat_output_0", "inputIndexes": [ 41, 43 ] , "outputIndexes": [ 44 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/rotary/Concat_1_output_0", "inputIndexes": [ 44, 44 ] , "outputIndexes": [ 45 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/rotary/Constant_7_output_0", "outputIndexes": [ 46 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 2 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/rotary/Unsqueeze_2_output_0", "inputIndexes": [ 45, 46 ] , "outputIndexes": [ 47 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/rotary/Unsqueeze_3_output_0", "inputIndexes": [ 47, 15 ] , "outputIndexes": [ 48 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "Shape107", "inputIndexes": [ 48 ] , "outputIndexes": [ 49 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank109", "inputIndexes": [ 48 ] , "outputIndexes": [ 50 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp111", "inputIndexes": [ 50, 50 ] , "outputIndexes": [ 51 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze112", "inputIndexes": [ 51 ] , "outputIndexes": [ 52 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp114", "inputIndexes": [ 51, 12 ] , "outputIndexes": [ 53 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze115", "inputIndexes": [ 53 ] , "outputIndexes": [ 54 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice118", "inputIndexes": [ 49, 52, 54, 15 ] , "outputIndexes": [ 55 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze119", "inputIndexes": [ 55 ] , "outputIndexes": [ 56 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp121", "inputIndexes": [ 56, 56 ] , "outputIndexes": [ 57 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_3_output_0", "inputIndexes": [ 48, 57, 51 ] , "outputIndexes": [ 58 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_output_0", "inputIndexes": [ 33, 58 ] , "outputIndexes": [ 59 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_2_output_0", "inputIndexes": [ 33 ] , "outputIndexes": [ 60 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Const", "name": "/Constant_6_output_0", "outputIndexes": [ 61 ] , "main_type": "Blob", "main": { "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 3 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "Shape238", "inputIndexes": [ 60 ] , "outputIndexes": [ 62 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank240", "inputIndexes": [ 60 ] , "outputIndexes": [ 63 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp242", "inputIndexes": [ 63, 63 ] , "outputIndexes": [ 64 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze243", "inputIndexes": [ 64 ] , "outputIndexes": [ 65 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp245", "inputIndexes": [ 64, 12 ] , "outputIndexes": [ 66 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze246", "inputIndexes": [ 66 ] , "outputIndexes": [ 67 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice249", "inputIndexes": [ 62, 65, 67, 15 ] , "outputIndexes": [ 68 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze250", "inputIndexes": [ 68 ] , "outputIndexes": [ 69 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp251", "inputIndexes": [ 61, 69 ] , "outputIndexes": [ 70 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp252", "inputIndexes": [ 70, 69 ] , "outputIndexes": [ 71 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_5_output_0", "inputIndexes": [ 60, 71, 64 ] , "outputIndexes": [ 72 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/rotary/Constant_6_output_0", "outputIndexes": [ 73 ] , "main_type": "Blob", "main": { "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 2 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_output_0", "inputIndexes": [ 72, 73 ] , "outputIndexes": [ 74 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_7_output_0", "inputIndexes": [ 74, 20 ] , "outputIndexes": [ 75 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/Constant_19_output_0", "outputIndexes": [ 76 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 1073741824 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Const", "name": "/Constant_7_output_0", "outputIndexes": [ 77 ] , "main_type": "Blob", "main": { "dims": [ 1 ] , "dataType": "DT_INT32", "dataFormat": "NCHW", "int32s": [ 3 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_1_output_0", "inputIndexes": [ 33, 75, 76, 77, 15 ] , "outputIndexes": [ 78 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_output_0", "inputIndexes": [ 78 ] , "outputIndexes": [ 79 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_6_output_0", "inputIndexes": [ 74, 20 ] , "outputIndexes": [ 80 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_output_0", "inputIndexes": [ 33, 20, 80, 77, 15 ] , "outputIndexes": [ 81 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_3_output_0", "inputIndexes": [ 79, 81 ] , "outputIndexes": [ 82 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze157", "inputIndexes": [ 51 ] , "outputIndexes": [ 83 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze160", "inputIndexes": [ 53 ] , "outputIndexes": [ 84 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice163", "inputIndexes": [ 49, 83, 84, 15 ] , "outputIndexes": [ 85 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze164", "inputIndexes": [ 85 ] , "outputIndexes": [ 86 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp165", "inputIndexes": [ 12, 86 ] , "outputIndexes": [ 87 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp166", "inputIndexes": [ 87, 86 ] , "outputIndexes": [ 88 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_4_output_0", "inputIndexes": [ 48, 88, 51 ] , "outputIndexes": [ 89 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_1_output_0", "inputIndexes": [ 82, 89 ] , "outputIndexes": [ 90 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_output_0", "inputIndexes": [ 59, 90 ] , "outputIndexes": [ 91 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/self_attn/k_proj/Linear", "inputIndexes": [ 2721 ] , "outputIndexes": [ 2726 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 378118, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2726 ] , "outputIndexes": [ 2727 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2727 ] , "outputIndexes": [ 92 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_2_output_0", "inputIndexes": [ 19, 20 ] , "outputIndexes": [ 93 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_3_output_0", "inputIndexes": [ 28, 20 ] , "outputIndexes": [ 94 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_1_output_0", "inputIndexes": [ 93, 94, 77, 31 ] , "outputIndexes": [ 95 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_2_output_0", "inputIndexes": [ 92, 95 ] , "outputIndexes": [ 96 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_2_output_0", "inputIndexes": [ 96, 58 ] , "outputIndexes": [ 97 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_3_output_0", "inputIndexes": [ 96 ] , "outputIndexes": [ 98 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape126", "inputIndexes": [ 98 ] , "outputIndexes": [ 99 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank128", "inputIndexes": [ 98 ] , "outputIndexes": [ 100 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp130", "inputIndexes": [ 100, 100 ] , "outputIndexes": [ 101 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze131", "inputIndexes": [ 101 ] , "outputIndexes": [ 102 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp133", "inputIndexes": [ 101, 12 ] , "outputIndexes": [ 103 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze134", "inputIndexes": [ 103 ] , "outputIndexes": [ 104 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice137", "inputIndexes": [ 99, 102, 104, 15 ] , "outputIndexes": [ 105 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze138", "inputIndexes": [ 105 ] , "outputIndexes": [ 106 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp139", "inputIndexes": [ 61, 106 ] , "outputIndexes": [ 107 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp140", "inputIndexes": [ 107, 106 ] , "outputIndexes": [ 108 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_6_output_0", "inputIndexes": [ 98, 108, 101 ] , "outputIndexes": [ 109 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_1_output_0", "inputIndexes": [ 109, 73 ] , "outputIndexes": [ 110 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_9_output_0", "inputIndexes": [ 110, 20 ] , "outputIndexes": [ 111 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_3_output_0", "inputIndexes": [ 96, 111, 76, 77, 15 ] , "outputIndexes": [ 112 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_1_output_0", "inputIndexes": [ 112 ] , "outputIndexes": [ 113 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_8_output_0", "inputIndexes": [ 110, 20 ] , "outputIndexes": [ 114 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_2_output_0", "inputIndexes": [ 96, 20, 114, 77, 15 ] , "outputIndexes": [ 115 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_4_output_0", "inputIndexes": [ 113, 115 ] , "outputIndexes": [ 116 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_3_output_0", "inputIndexes": [ 116, 89 ] , "outputIndexes": [ 117 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_1_output_0", "inputIndexes": [ 97, 117 ] , "outputIndexes": [ 118 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/self_attn/v_proj/Linear", "inputIndexes": [ 2721 ] , "outputIndexes": [ 2730 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 502796, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2730 ] , "outputIndexes": [ 2731 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2731 ] , "outputIndexes": [ 119 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_4_output_0", "inputIndexes": [ 19, 20 ] , "outputIndexes": [ 120 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_5_output_0", "inputIndexes": [ 28, 20 ] , "outputIndexes": [ 121 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_2_output_0", "inputIndexes": [ 120, 121, 77, 31 ] , "outputIndexes": [ 122 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_3_output_0", "inputIndexes": [ 119, 122 ] , "outputIndexes": [ 123 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_8_output_0", "inputIndexes": [ 91, 118, 123, 124 ] , "outputIndexes": [ 125 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 125 ] , "outputIndexes": [ 2732 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2732 ] , "outputIndexes": [ 2733 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/self_attn/o_proj/Linear", "inputIndexes": [ 2733 ] , "outputIndexes": [ 2734 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 627474, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2734 ] , "outputIndexes": [ 2735 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2735 ] , "outputIndexes": [ 126 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_3_output_0", "inputIndexes": [ 4, 126 ] , "outputIndexes": [ 127 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm/Mul_1_output_0", "inputIndexes": [ 127 ] , "outputIndexes": [ 128 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 1000984, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 128 ] , "outputIndexes": [ 2736 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2736 ] , "outputIndexes": [ 2737 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/mlp/gate_proj/Linear", "inputIndexes": [ 2737 ] , "outputIndexes": [ 2738 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1005592, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2738 ] , "outputIndexes": [ 2739 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2739 ] , "outputIndexes": [ 129 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn/Mul_output_0", "inputIndexes": [ 129 ] , "outputIndexes": [ 130 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/mlp/up_proj/Linear", "inputIndexes": [ 2737 ] , "outputIndexes": [ 2742 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2001182, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2742 ] , "outputIndexes": [ 2743 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2743 ] , "outputIndexes": [ 131 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp/Mul_output_0", "inputIndexes": [ 130, 131 ] , "outputIndexes": [ 132 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 132 ] , "outputIndexes": [ 2744 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2744 ] , "outputIndexes": [ 2745 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.0/mlp/down_proj/Linear", "inputIndexes": [ 2745 ] , "outputIndexes": [ 2746 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 2996772, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.0/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2746 ] , "outputIndexes": [ 2747 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2747 ] , "outputIndexes": [ 133 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_4_output_0", "inputIndexes": [ 127, 133 ] , "outputIndexes": [ 134 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_9_output_0", "inputIndexes": [ 134, 3 ] , "outputIndexes": [ 135 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_1/Mul_1_output_0", "inputIndexes": [ 135 ] , "outputIndexes": [ 136 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 3937066, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 136 ] , "outputIndexes": [ 2748 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2748 ] , "outputIndexes": [ 2749 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/self_attn/q_proj/Linear", "inputIndexes": [ 2749 ] , "outputIndexes": [ 2750 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3941674, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2750 ] , "outputIndexes": [ 2751 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2751 ] , "outputIndexes": [ 137 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_14_output_0", "inputIndexes": [ 136 ] , "outputIndexes": [ 138 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape481", "inputIndexes": [ 138 ] , "outputIndexes": [ 139 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank483", "inputIndexes": [ 138 ] , "outputIndexes": [ 140 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp485", "inputIndexes": [ 140, 140 ] , "outputIndexes": [ 141 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze486", "inputIndexes": [ 141 ] , "outputIndexes": [ 142 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp488", "inputIndexes": [ 141, 12 ] , "outputIndexes": [ 143 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze489", "inputIndexes": [ 143 ] , "outputIndexes": [ 144 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice492", "inputIndexes": [ 139, 142, 144, 15 ] , "outputIndexes": [ 145 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze493", "inputIndexes": [ 145 ] , "outputIndexes": [ 146 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp495", "inputIndexes": [ 146, 146 ] , "outputIndexes": [ 147 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_18_output_0", "inputIndexes": [ 138, 147, 141 ] , "outputIndexes": [ 148 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_32_output_0", "inputIndexes": [ 148, 20 ] , "outputIndexes": [ 149 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze503", "inputIndexes": [ 141 ] , "outputIndexes": [ 150 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze506", "inputIndexes": [ 143 ] , "outputIndexes": [ 151 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice509", "inputIndexes": [ 139, 150, 151, 15 ] , "outputIndexes": [ 152 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze510", "inputIndexes": [ 152 ] , "outputIndexes": [ 153 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp511", "inputIndexes": [ 12, 153 ] , "outputIndexes": [ 154 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp512", "inputIndexes": [ 154, 153 ] , "outputIndexes": [ 155 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_19_output_0", "inputIndexes": [ 138, 155, 141 ] , "outputIndexes": [ 156 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_33_output_0", "inputIndexes": [ 156, 20 ] , "outputIndexes": [ 157 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_13_output_0", "inputIndexes": [ 149, 157, 30, 31 ] , "outputIndexes": [ 158 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_10_output_0", "inputIndexes": [ 137, 158 ] , "outputIndexes": [ 159 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_8_output_0", "inputIndexes": [ 159, 58 ] , "outputIndexes": [ 160 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_16_output_0", "inputIndexes": [ 159 ] , "outputIndexes": [ 161 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape612", "inputIndexes": [ 161 ] , "outputIndexes": [ 162 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank614", "inputIndexes": [ 161 ] , "outputIndexes": [ 163 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp616", "inputIndexes": [ 163, 163 ] , "outputIndexes": [ 164 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze617", "inputIndexes": [ 164 ] , "outputIndexes": [ 165 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp619", "inputIndexes": [ 164, 12 ] , "outputIndexes": [ 166 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze620", "inputIndexes": [ 166 ] , "outputIndexes": [ 167 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice623", "inputIndexes": [ 162, 165, 167, 15 ] , "outputIndexes": [ 168 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze624", "inputIndexes": [ 168 ] , "outputIndexes": [ 169 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp625", "inputIndexes": [ 61, 169 ] , "outputIndexes": [ 170 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp626", "inputIndexes": [ 170, 169 ] , "outputIndexes": [ 171 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_20_output_0", "inputIndexes": [ 161, 171, 164 ] , "outputIndexes": [ 172 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_3_output_0", "inputIndexes": [ 172, 73 ] , "outputIndexes": [ 173 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_39_output_0", "inputIndexes": [ 173, 20 ] , "outputIndexes": [ 174 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_5_output_0", "inputIndexes": [ 159, 174, 76, 77, 15 ] , "outputIndexes": [ 175 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_2_output_0", "inputIndexes": [ 175 ] , "outputIndexes": [ 176 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_38_output_0", "inputIndexes": [ 173, 20 ] , "outputIndexes": [ 177 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_4_output_0", "inputIndexes": [ 159, 20, 177, 77, 15 ] , "outputIndexes": [ 178 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_16_output_0", "inputIndexes": [ 176, 178 ] , "outputIndexes": [ 179 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_9_output_0", "inputIndexes": [ 179, 89 ] , "outputIndexes": [ 180 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_5_output_0", "inputIndexes": [ 160, 180 ] , "outputIndexes": [ 181 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/self_attn/k_proj/Linear", "inputIndexes": [ 2749 ] , "outputIndexes": [ 2754 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4315184, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2754 ] , "outputIndexes": [ 2755 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2755 ] , "outputIndexes": [ 182 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_34_output_0", "inputIndexes": [ 148, 20 ] , "outputIndexes": [ 183 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_35_output_0", "inputIndexes": [ 156, 20 ] , "outputIndexes": [ 184 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_14_output_0", "inputIndexes": [ 183, 184, 77, 31 ] , "outputIndexes": [ 185 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_11_output_0", "inputIndexes": [ 182, 185 ] , "outputIndexes": [ 186 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_10_output_0", "inputIndexes": [ 186, 58 ] , "outputIndexes": [ 187 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_17_output_0", "inputIndexes": [ 186 ] , "outputIndexes": [ 188 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape519", "inputIndexes": [ 188 ] , "outputIndexes": [ 189 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank521", "inputIndexes": [ 188 ] , "outputIndexes": [ 190 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp523", "inputIndexes": [ 190, 190 ] , "outputIndexes": [ 191 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze524", "inputIndexes": [ 191 ] , "outputIndexes": [ 192 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp526", "inputIndexes": [ 191, 12 ] , "outputIndexes": [ 193 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze527", "inputIndexes": [ 193 ] , "outputIndexes": [ 194 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice530", "inputIndexes": [ 189, 192, 194, 15 ] , "outputIndexes": [ 195 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze531", "inputIndexes": [ 195 ] , "outputIndexes": [ 196 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp532", "inputIndexes": [ 61, 196 ] , "outputIndexes": [ 197 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp533", "inputIndexes": [ 197, 196 ] , "outputIndexes": [ 198 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_21_output_0", "inputIndexes": [ 188, 198, 191 ] , "outputIndexes": [ 199 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_4_output_0", "inputIndexes": [ 199, 73 ] , "outputIndexes": [ 200 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_41_output_0", "inputIndexes": [ 200, 20 ] , "outputIndexes": [ 201 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_7_output_0", "inputIndexes": [ 186, 201, 76, 77, 15 ] , "outputIndexes": [ 202 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_3_output_0", "inputIndexes": [ 202 ] , "outputIndexes": [ 203 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_40_output_0", "inputIndexes": [ 200, 20 ] , "outputIndexes": [ 204 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_6_output_0", "inputIndexes": [ 186, 20, 204, 77, 15 ] , "outputIndexes": [ 205 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_17_output_0", "inputIndexes": [ 203, 205 ] , "outputIndexes": [ 206 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_11_output_0", "inputIndexes": [ 206, 89 ] , "outputIndexes": [ 207 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_6_output_0", "inputIndexes": [ 187, 207 ] , "outputIndexes": [ 208 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/self_attn/v_proj/Linear", "inputIndexes": [ 2749 ] , "outputIndexes": [ 2758 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4439862, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2758 ] , "outputIndexes": [ 2759 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2759 ] , "outputIndexes": [ 209 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_36_output_0", "inputIndexes": [ 148, 20 ] , "outputIndexes": [ 210 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_37_output_0", "inputIndexes": [ 156, 20 ] , "outputIndexes": [ 211 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_15_output_0", "inputIndexes": [ 210, 211, 77, 31 ] , "outputIndexes": [ 212 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_12_output_0", "inputIndexes": [ 209, 212 ] , "outputIndexes": [ 213 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_17_output_0", "inputIndexes": [ 181, 208, 213, 124 ] , "outputIndexes": [ 214 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 214 ] , "outputIndexes": [ 2760 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2760 ] , "outputIndexes": [ 2761 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/self_attn/o_proj/Linear", "inputIndexes": [ 2761 ] , "outputIndexes": [ 2762 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4564540, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2762 ] , "outputIndexes": [ 2763 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2763 ] , "outputIndexes": [ 215 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_8_output_0", "inputIndexes": [ 135, 215 ] , "outputIndexes": [ 216 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_1/Mul_1_output_0", "inputIndexes": [ 216 ] , "outputIndexes": [ 217 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 4938050, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 217 ] , "outputIndexes": [ 2764 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2764 ] , "outputIndexes": [ 2765 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/mlp/gate_proj/Linear", "inputIndexes": [ 2765 ] , "outputIndexes": [ 2766 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 4942658, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2766 ] , "outputIndexes": [ 2767 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2767 ] , "outputIndexes": [ 218 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_1/Mul_output_0", "inputIndexes": [ 218 ] , "outputIndexes": [ 219 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/mlp/up_proj/Linear", "inputIndexes": [ 2765 ] , "outputIndexes": [ 2770 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 5938248, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2770 ] , "outputIndexes": [ 2771 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2771 ] , "outputIndexes": [ 220 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_1/Mul_output_0", "inputIndexes": [ 219, 220 ] , "outputIndexes": [ 221 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 221 ] , "outputIndexes": [ 2772 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2772 ] , "outputIndexes": [ 2773 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.1/mlp/down_proj/Linear", "inputIndexes": [ 2773 ] , "outputIndexes": [ 2774 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 6933838, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.1/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2774 ] , "outputIndexes": [ 2775 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2775 ] , "outputIndexes": [ 222 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_9_output_0", "inputIndexes": [ 216, 222 ] , "outputIndexes": [ 223 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_18_output_0", "inputIndexes": [ 223, 3 ] , "outputIndexes": [ 224 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_2/Mul_1_output_0", "inputIndexes": [ 224 ] , "outputIndexes": [ 225 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 7874132, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 225 ] , "outputIndexes": [ 2776 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2776 ] , "outputIndexes": [ 2777 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/self_attn/q_proj/Linear", "inputIndexes": [ 2777 ] , "outputIndexes": [ 2778 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 7878740, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2778 ] , "outputIndexes": [ 2779 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2779 ] , "outputIndexes": [ 226 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_28_output_0", "inputIndexes": [ 225 ] , "outputIndexes": [ 227 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape851", "inputIndexes": [ 227 ] , "outputIndexes": [ 228 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank853", "inputIndexes": [ 227 ] , "outputIndexes": [ 229 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp855", "inputIndexes": [ 229, 229 ] , "outputIndexes": [ 230 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze856", "inputIndexes": [ 230 ] , "outputIndexes": [ 231 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp858", "inputIndexes": [ 230, 12 ] , "outputIndexes": [ 232 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze859", "inputIndexes": [ 232 ] , "outputIndexes": [ 233 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice862", "inputIndexes": [ 228, 231, 233, 15 ] , "outputIndexes": [ 234 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze863", "inputIndexes": [ 234 ] , "outputIndexes": [ 235 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp865", "inputIndexes": [ 235, 235 ] , "outputIndexes": [ 236 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_33_output_0", "inputIndexes": [ 227, 236, 230 ] , "outputIndexes": [ 237 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_64_output_0", "inputIndexes": [ 237, 20 ] , "outputIndexes": [ 238 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze873", "inputIndexes": [ 230 ] , "outputIndexes": [ 239 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze876", "inputIndexes": [ 232 ] , "outputIndexes": [ 240 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice879", "inputIndexes": [ 228, 239, 240, 15 ] , "outputIndexes": [ 241 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze880", "inputIndexes": [ 241 ] , "outputIndexes": [ 242 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp881", "inputIndexes": [ 12, 242 ] , "outputIndexes": [ 243 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp882", "inputIndexes": [ 243, 242 ] , "outputIndexes": [ 244 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_34_output_0", "inputIndexes": [ 227, 244, 230 ] , "outputIndexes": [ 245 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_65_output_0", "inputIndexes": [ 245, 20 ] , "outputIndexes": [ 246 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_26_output_0", "inputIndexes": [ 238, 246, 30, 31 ] , "outputIndexes": [ 247 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_19_output_0", "inputIndexes": [ 226, 247 ] , "outputIndexes": [ 248 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_16_output_0", "inputIndexes": [ 248, 58 ] , "outputIndexes": [ 249 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_30_output_0", "inputIndexes": [ 248 ] , "outputIndexes": [ 250 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape982", "inputIndexes": [ 250 ] , "outputIndexes": [ 251 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank984", "inputIndexes": [ 250 ] , "outputIndexes": [ 252 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp986", "inputIndexes": [ 252, 252 ] , "outputIndexes": [ 253 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze987", "inputIndexes": [ 253 ] , "outputIndexes": [ 254 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp989", "inputIndexes": [ 253, 12 ] , "outputIndexes": [ 255 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze990", "inputIndexes": [ 255 ] , "outputIndexes": [ 256 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice993", "inputIndexes": [ 251, 254, 256, 15 ] , "outputIndexes": [ 257 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze994", "inputIndexes": [ 257 ] , "outputIndexes": [ 258 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp995", "inputIndexes": [ 61, 258 ] , "outputIndexes": [ 259 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp996", "inputIndexes": [ 259, 258 ] , "outputIndexes": [ 260 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_35_output_0", "inputIndexes": [ 250, 260, 253 ] , "outputIndexes": [ 261 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_6_output_0", "inputIndexes": [ 261, 73 ] , "outputIndexes": [ 262 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_71_output_0", "inputIndexes": [ 262, 20 ] , "outputIndexes": [ 263 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_9_output_0", "inputIndexes": [ 248, 263, 76, 77, 15 ] , "outputIndexes": [ 264 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_4_output_0", "inputIndexes": [ 264 ] , "outputIndexes": [ 265 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_70_output_0", "inputIndexes": [ 262, 20 ] , "outputIndexes": [ 266 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_8_output_0", "inputIndexes": [ 248, 20, 266, 77, 15 ] , "outputIndexes": [ 267 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_29_output_0", "inputIndexes": [ 265, 267 ] , "outputIndexes": [ 268 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_17_output_0", "inputIndexes": [ 268, 89 ] , "outputIndexes": [ 269 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_10_output_0", "inputIndexes": [ 249, 269 ] , "outputIndexes": [ 270 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/self_attn/k_proj/Linear", "inputIndexes": [ 2777 ] , "outputIndexes": [ 2782 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8252250, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2782 ] , "outputIndexes": [ 2783 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2783 ] , "outputIndexes": [ 271 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_66_output_0", "inputIndexes": [ 237, 20 ] , "outputIndexes": [ 272 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_67_output_0", "inputIndexes": [ 245, 20 ] , "outputIndexes": [ 273 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_27_output_0", "inputIndexes": [ 272, 273, 77, 31 ] , "outputIndexes": [ 274 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_20_output_0", "inputIndexes": [ 271, 274 ] , "outputIndexes": [ 275 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_18_output_0", "inputIndexes": [ 275, 58 ] , "outputIndexes": [ 276 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_31_output_0", "inputIndexes": [ 275 ] , "outputIndexes": [ 277 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape889", "inputIndexes": [ 277 ] , "outputIndexes": [ 278 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank891", "inputIndexes": [ 277 ] , "outputIndexes": [ 279 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp893", "inputIndexes": [ 279, 279 ] , "outputIndexes": [ 280 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze894", "inputIndexes": [ 280 ] , "outputIndexes": [ 281 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp896", "inputIndexes": [ 280, 12 ] , "outputIndexes": [ 282 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze897", "inputIndexes": [ 282 ] , "outputIndexes": [ 283 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice900", "inputIndexes": [ 278, 281, 283, 15 ] , "outputIndexes": [ 284 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze901", "inputIndexes": [ 284 ] , "outputIndexes": [ 285 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp902", "inputIndexes": [ 61, 285 ] , "outputIndexes": [ 286 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp903", "inputIndexes": [ 286, 285 ] , "outputIndexes": [ 287 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_36_output_0", "inputIndexes": [ 277, 287, 280 ] , "outputIndexes": [ 288 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_7_output_0", "inputIndexes": [ 288, 73 ] , "outputIndexes": [ 289 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_73_output_0", "inputIndexes": [ 289, 20 ] , "outputIndexes": [ 290 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_11_output_0", "inputIndexes": [ 275, 290, 76, 77, 15 ] , "outputIndexes": [ 291 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_5_output_0", "inputIndexes": [ 291 ] , "outputIndexes": [ 292 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_72_output_0", "inputIndexes": [ 289, 20 ] , "outputIndexes": [ 293 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_10_output_0", "inputIndexes": [ 275, 20, 293, 77, 15 ] , "outputIndexes": [ 294 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_30_output_0", "inputIndexes": [ 292, 294 ] , "outputIndexes": [ 295 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_19_output_0", "inputIndexes": [ 295, 89 ] , "outputIndexes": [ 296 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_11_output_0", "inputIndexes": [ 276, 296 ] , "outputIndexes": [ 297 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/self_attn/v_proj/Linear", "inputIndexes": [ 2777 ] , "outputIndexes": [ 2786 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8376928, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2786 ] , "outputIndexes": [ 2787 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2787 ] , "outputIndexes": [ 298 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_68_output_0", "inputIndexes": [ 237, 20 ] , "outputIndexes": [ 299 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_69_output_0", "inputIndexes": [ 245, 20 ] , "outputIndexes": [ 300 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_28_output_0", "inputIndexes": [ 299, 300, 77, 31 ] , "outputIndexes": [ 301 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_21_output_0", "inputIndexes": [ 298, 301 ] , "outputIndexes": [ 302 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_26_output_0", "inputIndexes": [ 270, 297, 302, 124 ] , "outputIndexes": [ 303 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 303 ] , "outputIndexes": [ 2788 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2788 ] , "outputIndexes": [ 2789 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/self_attn/o_proj/Linear", "inputIndexes": [ 2789 ] , "outputIndexes": [ 2790 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8501606, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2790 ] , "outputIndexes": [ 2791 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2791 ] , "outputIndexes": [ 304 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_13_output_0", "inputIndexes": [ 224, 304 ] , "outputIndexes": [ 305 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_2/Mul_1_output_0", "inputIndexes": [ 305 ] , "outputIndexes": [ 306 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 8875116, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 306 ] , "outputIndexes": [ 2792 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2792 ] , "outputIndexes": [ 2793 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/mlp/gate_proj/Linear", "inputIndexes": [ 2793 ] , "outputIndexes": [ 2794 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 8879724, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2794 ] , "outputIndexes": [ 2795 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2795 ] , "outputIndexes": [ 307 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_2/Mul_output_0", "inputIndexes": [ 307 ] , "outputIndexes": [ 308 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/mlp/up_proj/Linear", "inputIndexes": [ 2793 ] , "outputIndexes": [ 2798 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9875314, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2798 ] , "outputIndexes": [ 2799 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2799 ] , "outputIndexes": [ 309 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_2/Mul_output_0", "inputIndexes": [ 308, 309 ] , "outputIndexes": [ 310 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 310 ] , "outputIndexes": [ 2800 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2800 ] , "outputIndexes": [ 2801 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.2/mlp/down_proj/Linear", "inputIndexes": [ 2801 ] , "outputIndexes": [ 2802 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 10870904, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.2/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2802 ] , "outputIndexes": [ 2803 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2803 ] , "outputIndexes": [ 311 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_14_output_0", "inputIndexes": [ 305, 311 ] , "outputIndexes": [ 312 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_27_output_0", "inputIndexes": [ 312, 3 ] , "outputIndexes": [ 313 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_3/Mul_1_output_0", "inputIndexes": [ 313 ] , "outputIndexes": [ 314 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 11811198, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 314 ] , "outputIndexes": [ 2804 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2804 ] , "outputIndexes": [ 2805 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/self_attn/q_proj/Linear", "inputIndexes": [ 2805 ] , "outputIndexes": [ 2806 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 11815806, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2806 ] , "outputIndexes": [ 2807 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2807 ] , "outputIndexes": [ 315 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_42_output_0", "inputIndexes": [ 314 ] , "outputIndexes": [ 316 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1221", "inputIndexes": [ 316 ] , "outputIndexes": [ 317 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1223", "inputIndexes": [ 316 ] , "outputIndexes": [ 318 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1225", "inputIndexes": [ 318, 318 ] , "outputIndexes": [ 319 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1226", "inputIndexes": [ 319 ] , "outputIndexes": [ 320 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1228", "inputIndexes": [ 319, 12 ] , "outputIndexes": [ 321 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1229", "inputIndexes": [ 321 ] , "outputIndexes": [ 322 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1232", "inputIndexes": [ 317, 320, 322, 15 ] , "outputIndexes": [ 323 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1233", "inputIndexes": [ 323 ] , "outputIndexes": [ 324 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1235", "inputIndexes": [ 324, 324 ] , "outputIndexes": [ 325 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_48_output_0", "inputIndexes": [ 316, 325, 319 ] , "outputIndexes": [ 326 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_96_output_0", "inputIndexes": [ 326, 20 ] , "outputIndexes": [ 327 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1243", "inputIndexes": [ 319 ] , "outputIndexes": [ 328 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1246", "inputIndexes": [ 321 ] , "outputIndexes": [ 329 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1249", "inputIndexes": [ 317, 328, 329, 15 ] , "outputIndexes": [ 330 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1250", "inputIndexes": [ 330 ] , "outputIndexes": [ 331 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1251", "inputIndexes": [ 12, 331 ] , "outputIndexes": [ 332 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1252", "inputIndexes": [ 332, 331 ] , "outputIndexes": [ 333 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_49_output_0", "inputIndexes": [ 316, 333, 319 ] , "outputIndexes": [ 334 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_97_output_0", "inputIndexes": [ 334, 20 ] , "outputIndexes": [ 335 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_39_output_0", "inputIndexes": [ 327, 335, 30, 31 ] , "outputIndexes": [ 336 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_28_output_0", "inputIndexes": [ 315, 336 ] , "outputIndexes": [ 337 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_24_output_0", "inputIndexes": [ 337, 58 ] , "outputIndexes": [ 338 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_44_output_0", "inputIndexes": [ 337 ] , "outputIndexes": [ 339 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1353", "inputIndexes": [ 339 ] , "outputIndexes": [ 340 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1355", "inputIndexes": [ 339 ] , "outputIndexes": [ 341 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1357", "inputIndexes": [ 341, 341 ] , "outputIndexes": [ 342 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1358", "inputIndexes": [ 342 ] , "outputIndexes": [ 343 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1360", "inputIndexes": [ 342, 12 ] , "outputIndexes": [ 344 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1361", "inputIndexes": [ 344 ] , "outputIndexes": [ 345 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1364", "inputIndexes": [ 340, 343, 345, 15 ] , "outputIndexes": [ 346 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1365", "inputIndexes": [ 346 ] , "outputIndexes": [ 347 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1366", "inputIndexes": [ 61, 347 ] , "outputIndexes": [ 348 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1367", "inputIndexes": [ 348, 347 ] , "outputIndexes": [ 349 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_50_output_0", "inputIndexes": [ 339, 349, 342 ] , "outputIndexes": [ 350 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_9_output_0", "inputIndexes": [ 350, 73 ] , "outputIndexes": [ 351 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_103_output_0", "inputIndexes": [ 351, 20 ] , "outputIndexes": [ 352 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_13_output_0", "inputIndexes": [ 337, 352, 76, 77, 15 ] , "outputIndexes": [ 353 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_6_output_0", "inputIndexes": [ 353 ] , "outputIndexes": [ 354 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_102_output_0", "inputIndexes": [ 351, 20 ] , "outputIndexes": [ 355 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_12_output_0", "inputIndexes": [ 337, 20, 355, 77, 15 ] , "outputIndexes": [ 356 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_42_output_0", "inputIndexes": [ 354, 356 ] , "outputIndexes": [ 357 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_25_output_0", "inputIndexes": [ 357, 89 ] , "outputIndexes": [ 358 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_15_output_0", "inputIndexes": [ 338, 358 ] , "outputIndexes": [ 359 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/self_attn/k_proj/Linear", "inputIndexes": [ 2805 ] , "outputIndexes": [ 2810 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 12189316, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2810 ] , "outputIndexes": [ 2811 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2811 ] , "outputIndexes": [ 360 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_98_output_0", "inputIndexes": [ 326, 20 ] , "outputIndexes": [ 361 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_99_output_0", "inputIndexes": [ 334, 20 ] , "outputIndexes": [ 362 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_40_output_0", "inputIndexes": [ 361, 362, 77, 31 ] , "outputIndexes": [ 363 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_29_output_0", "inputIndexes": [ 360, 363 ] , "outputIndexes": [ 364 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_26_output_0", "inputIndexes": [ 364, 58 ] , "outputIndexes": [ 365 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_45_output_0", "inputIndexes": [ 364 ] , "outputIndexes": [ 366 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1259", "inputIndexes": [ 366 ] , "outputIndexes": [ 367 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1261", "inputIndexes": [ 366 ] , "outputIndexes": [ 368 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1263", "inputIndexes": [ 368, 368 ] , "outputIndexes": [ 369 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1264", "inputIndexes": [ 369 ] , "outputIndexes": [ 370 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1266", "inputIndexes": [ 369, 12 ] , "outputIndexes": [ 371 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1267", "inputIndexes": [ 371 ] , "outputIndexes": [ 372 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1270", "inputIndexes": [ 367, 370, 372, 15 ] , "outputIndexes": [ 373 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1271", "inputIndexes": [ 373 ] , "outputIndexes": [ 374 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1272", "inputIndexes": [ 61, 374 ] , "outputIndexes": [ 375 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1273", "inputIndexes": [ 375, 374 ] , "outputIndexes": [ 376 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_51_output_0", "inputIndexes": [ 366, 376, 369 ] , "outputIndexes": [ 377 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_10_output_0", "inputIndexes": [ 377, 73 ] , "outputIndexes": [ 378 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_105_output_0", "inputIndexes": [ 378, 20 ] , "outputIndexes": [ 379 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_15_output_0", "inputIndexes": [ 364, 379, 76, 77, 15 ] , "outputIndexes": [ 380 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_7_output_0", "inputIndexes": [ 380 ] , "outputIndexes": [ 381 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_104_output_0", "inputIndexes": [ 378, 20 ] , "outputIndexes": [ 382 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_14_output_0", "inputIndexes": [ 364, 20, 382, 77, 15 ] , "outputIndexes": [ 383 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_43_output_0", "inputIndexes": [ 381, 383 ] , "outputIndexes": [ 384 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_27_output_0", "inputIndexes": [ 384, 89 ] , "outputIndexes": [ 385 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_16_output_0", "inputIndexes": [ 365, 385 ] , "outputIndexes": [ 386 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/self_attn/v_proj/Linear", "inputIndexes": [ 2805 ] , "outputIndexes": [ 2814 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 12313994, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2814 ] , "outputIndexes": [ 2815 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2815 ] , "outputIndexes": [ 387 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_100_output_0", "inputIndexes": [ 326, 20 ] , "outputIndexes": [ 388 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_101_output_0", "inputIndexes": [ 334, 20 ] , "outputIndexes": [ 389 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_41_output_0", "inputIndexes": [ 388, 389, 77, 31 ] , "outputIndexes": [ 390 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_30_output_0", "inputIndexes": [ 387, 390 ] , "outputIndexes": [ 391 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_35_output_0", "inputIndexes": [ 359, 386, 391, 124 ] , "outputIndexes": [ 392 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 392 ] , "outputIndexes": [ 2816 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2816 ] , "outputIndexes": [ 2817 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/self_attn/o_proj/Linear", "inputIndexes": [ 2817 ] , "outputIndexes": [ 2818 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 12438672, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2818 ] , "outputIndexes": [ 2819 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2819 ] , "outputIndexes": [ 393 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_18_output_0", "inputIndexes": [ 313, 393 ] , "outputIndexes": [ 394 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_3/Mul_1_output_0", "inputIndexes": [ 394 ] , "outputIndexes": [ 395 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 12812182, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 395 ] , "outputIndexes": [ 2820 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2820 ] , "outputIndexes": [ 2821 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/mlp/gate_proj/Linear", "inputIndexes": [ 2821 ] , "outputIndexes": [ 2822 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 12816790, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2822 ] , "outputIndexes": [ 2823 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2823 ] , "outputIndexes": [ 396 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_3/Mul_output_0", "inputIndexes": [ 396 ] , "outputIndexes": [ 397 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/mlp/up_proj/Linear", "inputIndexes": [ 2821 ] , "outputIndexes": [ 2826 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 13812380, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2826 ] , "outputIndexes": [ 2827 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2827 ] , "outputIndexes": [ 398 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_3/Mul_output_0", "inputIndexes": [ 397, 398 ] , "outputIndexes": [ 399 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 399 ] , "outputIndexes": [ 2828 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2828 ] , "outputIndexes": [ 2829 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.3/mlp/down_proj/Linear", "inputIndexes": [ 2829 ] , "outputIndexes": [ 2830 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 14807970, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.3/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2830 ] , "outputIndexes": [ 2831 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2831 ] , "outputIndexes": [ 400 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_19_output_0", "inputIndexes": [ 394, 400 ] , "outputIndexes": [ 401 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_36_output_0", "inputIndexes": [ 401, 3 ] , "outputIndexes": [ 402 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_4/Mul_1_output_0", "inputIndexes": [ 402 ] , "outputIndexes": [ 403 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 15748264, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 403 ] , "outputIndexes": [ 2832 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2832 ] , "outputIndexes": [ 2833 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/self_attn/q_proj/Linear", "inputIndexes": [ 2833 ] , "outputIndexes": [ 2834 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 15752872, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2834 ] , "outputIndexes": [ 2835 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2835 ] , "outputIndexes": [ 404 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_56_output_0", "inputIndexes": [ 403 ] , "outputIndexes": [ 405 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1592", "inputIndexes": [ 405 ] , "outputIndexes": [ 406 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1594", "inputIndexes": [ 405 ] , "outputIndexes": [ 407 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1596", "inputIndexes": [ 407, 407 ] , "outputIndexes": [ 408 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1597", "inputIndexes": [ 408 ] , "outputIndexes": [ 409 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1599", "inputIndexes": [ 408, 12 ] , "outputIndexes": [ 410 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1600", "inputIndexes": [ 410 ] , "outputIndexes": [ 411 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1603", "inputIndexes": [ 406, 409, 411, 15 ] , "outputIndexes": [ 412 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1604", "inputIndexes": [ 412 ] , "outputIndexes": [ 413 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1606", "inputIndexes": [ 413, 413 ] , "outputIndexes": [ 414 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_63_output_0", "inputIndexes": [ 405, 414, 408 ] , "outputIndexes": [ 415 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_128_output_0", "inputIndexes": [ 415, 20 ] , "outputIndexes": [ 416 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1614", "inputIndexes": [ 408 ] , "outputIndexes": [ 417 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1617", "inputIndexes": [ 410 ] , "outputIndexes": [ 418 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1620", "inputIndexes": [ 406, 417, 418, 15 ] , "outputIndexes": [ 419 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1621", "inputIndexes": [ 419 ] , "outputIndexes": [ 420 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1622", "inputIndexes": [ 12, 420 ] , "outputIndexes": [ 421 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1623", "inputIndexes": [ 421, 420 ] , "outputIndexes": [ 422 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_64_output_0", "inputIndexes": [ 405, 422, 408 ] , "outputIndexes": [ 423 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_129_output_0", "inputIndexes": [ 423, 20 ] , "outputIndexes": [ 424 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_52_output_0", "inputIndexes": [ 416, 424, 30, 31 ] , "outputIndexes": [ 425 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_37_output_0", "inputIndexes": [ 404, 425 ] , "outputIndexes": [ 426 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_32_output_0", "inputIndexes": [ 426, 58 ] , "outputIndexes": [ 427 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_58_output_0", "inputIndexes": [ 426 ] , "outputIndexes": [ 428 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1724", "inputIndexes": [ 428 ] , "outputIndexes": [ 429 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1726", "inputIndexes": [ 428 ] , "outputIndexes": [ 430 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1728", "inputIndexes": [ 430, 430 ] , "outputIndexes": [ 431 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1729", "inputIndexes": [ 431 ] , "outputIndexes": [ 432 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1731", "inputIndexes": [ 431, 12 ] , "outputIndexes": [ 433 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1732", "inputIndexes": [ 433 ] , "outputIndexes": [ 434 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1735", "inputIndexes": [ 429, 432, 434, 15 ] , "outputIndexes": [ 435 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1736", "inputIndexes": [ 435 ] , "outputIndexes": [ 436 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1737", "inputIndexes": [ 61, 436 ] , "outputIndexes": [ 437 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1738", "inputIndexes": [ 437, 436 ] , "outputIndexes": [ 438 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_65_output_0", "inputIndexes": [ 428, 438, 431 ] , "outputIndexes": [ 439 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_12_output_0", "inputIndexes": [ 439, 73 ] , "outputIndexes": [ 440 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_135_output_0", "inputIndexes": [ 440, 20 ] , "outputIndexes": [ 441 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_17_output_0", "inputIndexes": [ 426, 441, 76, 77, 15 ] , "outputIndexes": [ 442 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_8_output_0", "inputIndexes": [ 442 ] , "outputIndexes": [ 443 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_134_output_0", "inputIndexes": [ 440, 20 ] , "outputIndexes": [ 444 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_16_output_0", "inputIndexes": [ 426, 20, 444, 77, 15 ] , "outputIndexes": [ 445 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_55_output_0", "inputIndexes": [ 443, 445 ] , "outputIndexes": [ 446 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_33_output_0", "inputIndexes": [ 446, 89 ] , "outputIndexes": [ 447 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_20_output_0", "inputIndexes": [ 427, 447 ] , "outputIndexes": [ 448 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/self_attn/k_proj/Linear", "inputIndexes": [ 2833 ] , "outputIndexes": [ 2838 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 16126382, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2838 ] , "outputIndexes": [ 2839 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2839 ] , "outputIndexes": [ 449 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_130_output_0", "inputIndexes": [ 415, 20 ] , "outputIndexes": [ 450 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_131_output_0", "inputIndexes": [ 423, 20 ] , "outputIndexes": [ 451 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_53_output_0", "inputIndexes": [ 450, 451, 77, 31 ] , "outputIndexes": [ 452 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_38_output_0", "inputIndexes": [ 449, 452 ] , "outputIndexes": [ 453 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_34_output_0", "inputIndexes": [ 453, 58 ] , "outputIndexes": [ 454 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_59_output_0", "inputIndexes": [ 453 ] , "outputIndexes": [ 455 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1630", "inputIndexes": [ 455 ] , "outputIndexes": [ 456 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1632", "inputIndexes": [ 455 ] , "outputIndexes": [ 457 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1634", "inputIndexes": [ 457, 457 ] , "outputIndexes": [ 458 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1635", "inputIndexes": [ 458 ] , "outputIndexes": [ 459 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1637", "inputIndexes": [ 458, 12 ] , "outputIndexes": [ 460 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1638", "inputIndexes": [ 460 ] , "outputIndexes": [ 461 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1641", "inputIndexes": [ 456, 459, 461, 15 ] , "outputIndexes": [ 462 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1642", "inputIndexes": [ 462 ] , "outputIndexes": [ 463 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1643", "inputIndexes": [ 61, 463 ] , "outputIndexes": [ 464 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1644", "inputIndexes": [ 464, 463 ] , "outputIndexes": [ 465 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_66_output_0", "inputIndexes": [ 455, 465, 458 ] , "outputIndexes": [ 466 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_13_output_0", "inputIndexes": [ 466, 73 ] , "outputIndexes": [ 467 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_137_output_0", "inputIndexes": [ 467, 20 ] , "outputIndexes": [ 468 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_19_output_0", "inputIndexes": [ 453, 468, 76, 77, 15 ] , "outputIndexes": [ 469 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_9_output_0", "inputIndexes": [ 469 ] , "outputIndexes": [ 470 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_136_output_0", "inputIndexes": [ 467, 20 ] , "outputIndexes": [ 471 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_18_output_0", "inputIndexes": [ 453, 20, 471, 77, 15 ] , "outputIndexes": [ 472 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_56_output_0", "inputIndexes": [ 470, 472 ] , "outputIndexes": [ 473 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_35_output_0", "inputIndexes": [ 473, 89 ] , "outputIndexes": [ 474 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_21_output_0", "inputIndexes": [ 454, 474 ] , "outputIndexes": [ 475 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/self_attn/v_proj/Linear", "inputIndexes": [ 2833 ] , "outputIndexes": [ 2842 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 16251060, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2842 ] , "outputIndexes": [ 2843 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2843 ] , "outputIndexes": [ 476 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_132_output_0", "inputIndexes": [ 415, 20 ] , "outputIndexes": [ 477 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_133_output_0", "inputIndexes": [ 423, 20 ] , "outputIndexes": [ 478 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_54_output_0", "inputIndexes": [ 477, 478, 77, 31 ] , "outputIndexes": [ 479 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_39_output_0", "inputIndexes": [ 476, 479 ] , "outputIndexes": [ 480 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_44_output_0", "inputIndexes": [ 448, 475, 480, 124 ] , "outputIndexes": [ 481 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 481 ] , "outputIndexes": [ 2844 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2844 ] , "outputIndexes": [ 2845 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/self_attn/o_proj/Linear", "inputIndexes": [ 2845 ] , "outputIndexes": [ 2846 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 16375738, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2846 ] , "outputIndexes": [ 2847 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2847 ] , "outputIndexes": [ 482 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_23_output_0", "inputIndexes": [ 402, 482 ] , "outputIndexes": [ 483 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_4/Mul_1_output_0", "inputIndexes": [ 483 ] , "outputIndexes": [ 484 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 16749248, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 484 ] , "outputIndexes": [ 2848 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2848 ] , "outputIndexes": [ 2849 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/mlp/gate_proj/Linear", "inputIndexes": [ 2849 ] , "outputIndexes": [ 2850 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 16753856, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2850 ] , "outputIndexes": [ 2851 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2851 ] , "outputIndexes": [ 485 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_4/Mul_output_0", "inputIndexes": [ 485 ] , "outputIndexes": [ 486 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/mlp/up_proj/Linear", "inputIndexes": [ 2849 ] , "outputIndexes": [ 2854 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 17749446, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2854 ] , "outputIndexes": [ 2855 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2855 ] , "outputIndexes": [ 487 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_4/Mul_output_0", "inputIndexes": [ 486, 487 ] , "outputIndexes": [ 488 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 488 ] , "outputIndexes": [ 2856 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2856 ] , "outputIndexes": [ 2857 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.4/mlp/down_proj/Linear", "inputIndexes": [ 2857 ] , "outputIndexes": [ 2858 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 18745036, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.4/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2858 ] , "outputIndexes": [ 2859 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2859 ] , "outputIndexes": [ 489 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_24_output_0", "inputIndexes": [ 483, 489 ] , "outputIndexes": [ 490 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_45_output_0", "inputIndexes": [ 490, 3 ] , "outputIndexes": [ 491 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_5/Mul_1_output_0", "inputIndexes": [ 491 ] , "outputIndexes": [ 492 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 19685330, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 492 ] , "outputIndexes": [ 2860 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2860 ] , "outputIndexes": [ 2861 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/self_attn/q_proj/Linear", "inputIndexes": [ 2861 ] , "outputIndexes": [ 2862 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 19689938, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2862 ] , "outputIndexes": [ 2863 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2863 ] , "outputIndexes": [ 493 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_70_output_0", "inputIndexes": [ 492 ] , "outputIndexes": [ 494 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape1963", "inputIndexes": [ 494 ] , "outputIndexes": [ 495 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank1965", "inputIndexes": [ 494 ] , "outputIndexes": [ 496 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1967", "inputIndexes": [ 496, 496 ] , "outputIndexes": [ 497 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1968", "inputIndexes": [ 497 ] , "outputIndexes": [ 498 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1970", "inputIndexes": [ 497, 12 ] , "outputIndexes": [ 499 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1971", "inputIndexes": [ 499 ] , "outputIndexes": [ 500 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1974", "inputIndexes": [ 495, 498, 500, 15 ] , "outputIndexes": [ 501 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1975", "inputIndexes": [ 501 ] , "outputIndexes": [ 502 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1977", "inputIndexes": [ 502, 502 ] , "outputIndexes": [ 503 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_78_output_0", "inputIndexes": [ 494, 503, 497 ] , "outputIndexes": [ 504 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_160_output_0", "inputIndexes": [ 504, 20 ] , "outputIndexes": [ 505 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1985", "inputIndexes": [ 497 ] , "outputIndexes": [ 506 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze1988", "inputIndexes": [ 499 ] , "outputIndexes": [ 507 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice1991", "inputIndexes": [ 495, 506, 507, 15 ] , "outputIndexes": [ 508 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze1992", "inputIndexes": [ 508 ] , "outputIndexes": [ 509 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1993", "inputIndexes": [ 12, 509 ] , "outputIndexes": [ 510 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp1994", "inputIndexes": [ 510, 509 ] , "outputIndexes": [ 511 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_79_output_0", "inputIndexes": [ 494, 511, 497 ] , "outputIndexes": [ 512 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_161_output_0", "inputIndexes": [ 512, 20 ] , "outputIndexes": [ 513 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_65_output_0", "inputIndexes": [ 505, 513, 30, 31 ] , "outputIndexes": [ 514 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_46_output_0", "inputIndexes": [ 493, 514 ] , "outputIndexes": [ 515 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_40_output_0", "inputIndexes": [ 515, 58 ] , "outputIndexes": [ 516 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_72_output_0", "inputIndexes": [ 515 ] , "outputIndexes": [ 517 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2095", "inputIndexes": [ 517 ] , "outputIndexes": [ 518 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2097", "inputIndexes": [ 517 ] , "outputIndexes": [ 519 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2099", "inputIndexes": [ 519, 519 ] , "outputIndexes": [ 520 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2100", "inputIndexes": [ 520 ] , "outputIndexes": [ 521 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2102", "inputIndexes": [ 520, 12 ] , "outputIndexes": [ 522 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2103", "inputIndexes": [ 522 ] , "outputIndexes": [ 523 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2106", "inputIndexes": [ 518, 521, 523, 15 ] , "outputIndexes": [ 524 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2107", "inputIndexes": [ 524 ] , "outputIndexes": [ 525 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2108", "inputIndexes": [ 61, 525 ] , "outputIndexes": [ 526 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2109", "inputIndexes": [ 526, 525 ] , "outputIndexes": [ 527 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_80_output_0", "inputIndexes": [ 517, 527, 520 ] , "outputIndexes": [ 528 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_15_output_0", "inputIndexes": [ 528, 73 ] , "outputIndexes": [ 529 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_167_output_0", "inputIndexes": [ 529, 20 ] , "outputIndexes": [ 530 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_21_output_0", "inputIndexes": [ 515, 530, 76, 77, 15 ] , "outputIndexes": [ 531 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_10_output_0", "inputIndexes": [ 531 ] , "outputIndexes": [ 532 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_166_output_0", "inputIndexes": [ 529, 20 ] , "outputIndexes": [ 533 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_20_output_0", "inputIndexes": [ 515, 20, 533, 77, 15 ] , "outputIndexes": [ 534 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_68_output_0", "inputIndexes": [ 532, 534 ] , "outputIndexes": [ 535 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_41_output_0", "inputIndexes": [ 535, 89 ] , "outputIndexes": [ 536 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_25_output_0", "inputIndexes": [ 516, 536 ] , "outputIndexes": [ 537 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/self_attn/k_proj/Linear", "inputIndexes": [ 2861 ] , "outputIndexes": [ 2866 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20063448, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2866 ] , "outputIndexes": [ 2867 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2867 ] , "outputIndexes": [ 538 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_162_output_0", "inputIndexes": [ 504, 20 ] , "outputIndexes": [ 539 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_163_output_0", "inputIndexes": [ 512, 20 ] , "outputIndexes": [ 540 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_66_output_0", "inputIndexes": [ 539, 540, 77, 31 ] , "outputIndexes": [ 541 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_47_output_0", "inputIndexes": [ 538, 541 ] , "outputIndexes": [ 542 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_42_output_0", "inputIndexes": [ 542, 58 ] , "outputIndexes": [ 543 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_73_output_0", "inputIndexes": [ 542 ] , "outputIndexes": [ 544 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2001", "inputIndexes": [ 544 ] , "outputIndexes": [ 545 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2003", "inputIndexes": [ 544 ] , "outputIndexes": [ 546 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2005", "inputIndexes": [ 546, 546 ] , "outputIndexes": [ 547 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2006", "inputIndexes": [ 547 ] , "outputIndexes": [ 548 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2008", "inputIndexes": [ 547, 12 ] , "outputIndexes": [ 549 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2009", "inputIndexes": [ 549 ] , "outputIndexes": [ 550 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2012", "inputIndexes": [ 545, 548, 550, 15 ] , "outputIndexes": [ 551 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2013", "inputIndexes": [ 551 ] , "outputIndexes": [ 552 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2014", "inputIndexes": [ 61, 552 ] , "outputIndexes": [ 553 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2015", "inputIndexes": [ 553, 552 ] , "outputIndexes": [ 554 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_81_output_0", "inputIndexes": [ 544, 554, 547 ] , "outputIndexes": [ 555 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_16_output_0", "inputIndexes": [ 555, 73 ] , "outputIndexes": [ 556 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_169_output_0", "inputIndexes": [ 556, 20 ] , "outputIndexes": [ 557 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_23_output_0", "inputIndexes": [ 542, 557, 76, 77, 15 ] , "outputIndexes": [ 558 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_11_output_0", "inputIndexes": [ 558 ] , "outputIndexes": [ 559 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_168_output_0", "inputIndexes": [ 556, 20 ] , "outputIndexes": [ 560 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_22_output_0", "inputIndexes": [ 542, 20, 560, 77, 15 ] , "outputIndexes": [ 561 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_69_output_0", "inputIndexes": [ 559, 561 ] , "outputIndexes": [ 562 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_43_output_0", "inputIndexes": [ 562, 89 ] , "outputIndexes": [ 563 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_26_output_0", "inputIndexes": [ 543, 563 ] , "outputIndexes": [ 564 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/self_attn/v_proj/Linear", "inputIndexes": [ 2861 ] , "outputIndexes": [ 2870 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20188126, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2870 ] , "outputIndexes": [ 2871 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2871 ] , "outputIndexes": [ 565 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_164_output_0", "inputIndexes": [ 504, 20 ] , "outputIndexes": [ 566 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_165_output_0", "inputIndexes": [ 512, 20 ] , "outputIndexes": [ 567 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_67_output_0", "inputIndexes": [ 566, 567, 77, 31 ] , "outputIndexes": [ 568 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_48_output_0", "inputIndexes": [ 565, 568 ] , "outputIndexes": [ 569 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_53_output_0", "inputIndexes": [ 537, 564, 569, 124 ] , "outputIndexes": [ 570 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 570 ] , "outputIndexes": [ 2872 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2872 ] , "outputIndexes": [ 2873 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/self_attn/o_proj/Linear", "inputIndexes": [ 2873 ] , "outputIndexes": [ 2874 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20312804, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2874 ] , "outputIndexes": [ 2875 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2875 ] , "outputIndexes": [ 571 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_28_output_0", "inputIndexes": [ 491, 571 ] , "outputIndexes": [ 572 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_5/Mul_1_output_0", "inputIndexes": [ 572 ] , "outputIndexes": [ 573 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 20686314, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 573 ] , "outputIndexes": [ 2876 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2876 ] , "outputIndexes": [ 2877 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/mlp/gate_proj/Linear", "inputIndexes": [ 2877 ] , "outputIndexes": [ 2878 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 20690922, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2878 ] , "outputIndexes": [ 2879 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2879 ] , "outputIndexes": [ 574 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_5/Mul_output_0", "inputIndexes": [ 574 ] , "outputIndexes": [ 575 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/mlp/up_proj/Linear", "inputIndexes": [ 2877 ] , "outputIndexes": [ 2882 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 21686512, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2882 ] , "outputIndexes": [ 2883 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2883 ] , "outputIndexes": [ 576 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_5/Mul_output_0", "inputIndexes": [ 575, 576 ] , "outputIndexes": [ 577 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 577 ] , "outputIndexes": [ 2884 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2884 ] , "outputIndexes": [ 2885 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.5/mlp/down_proj/Linear", "inputIndexes": [ 2885 ] , "outputIndexes": [ 2886 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 22682102, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.5/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2886 ] , "outputIndexes": [ 2887 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2887 ] , "outputIndexes": [ 578 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_29_output_0", "inputIndexes": [ 572, 578 ] , "outputIndexes": [ 579 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_54_output_0", "inputIndexes": [ 579, 3 ] , "outputIndexes": [ 580 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_6/Mul_1_output_0", "inputIndexes": [ 580 ] , "outputIndexes": [ 581 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 23622396, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 581 ] , "outputIndexes": [ 2888 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2888 ] , "outputIndexes": [ 2889 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/self_attn/q_proj/Linear", "inputIndexes": [ 2889 ] , "outputIndexes": [ 2890 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 23627004, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2890 ] , "outputIndexes": [ 2891 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2891 ] , "outputIndexes": [ 582 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_84_output_0", "inputIndexes": [ 581 ] , "outputIndexes": [ 583 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2334", "inputIndexes": [ 583 ] , "outputIndexes": [ 584 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2336", "inputIndexes": [ 583 ] , "outputIndexes": [ 585 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2338", "inputIndexes": [ 585, 585 ] , "outputIndexes": [ 586 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2339", "inputIndexes": [ 586 ] , "outputIndexes": [ 587 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2341", "inputIndexes": [ 586, 12 ] , "outputIndexes": [ 588 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2342", "inputIndexes": [ 588 ] , "outputIndexes": [ 589 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2345", "inputIndexes": [ 584, 587, 589, 15 ] , "outputIndexes": [ 590 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2346", "inputIndexes": [ 590 ] , "outputIndexes": [ 591 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2348", "inputIndexes": [ 591, 591 ] , "outputIndexes": [ 592 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_93_output_0", "inputIndexes": [ 583, 592, 586 ] , "outputIndexes": [ 593 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_192_output_0", "inputIndexes": [ 593, 20 ] , "outputIndexes": [ 594 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2356", "inputIndexes": [ 586 ] , "outputIndexes": [ 595 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2359", "inputIndexes": [ 588 ] , "outputIndexes": [ 596 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2362", "inputIndexes": [ 584, 595, 596, 15 ] , "outputIndexes": [ 597 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2363", "inputIndexes": [ 597 ] , "outputIndexes": [ 598 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2364", "inputIndexes": [ 12, 598 ] , "outputIndexes": [ 599 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2365", "inputIndexes": [ 599, 598 ] , "outputIndexes": [ 600 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_94_output_0", "inputIndexes": [ 583, 600, 586 ] , "outputIndexes": [ 601 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_193_output_0", "inputIndexes": [ 601, 20 ] , "outputIndexes": [ 602 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_78_output_0", "inputIndexes": [ 594, 602, 30, 31 ] , "outputIndexes": [ 603 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_55_output_0", "inputIndexes": [ 582, 603 ] , "outputIndexes": [ 604 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_48_output_0", "inputIndexes": [ 604, 58 ] , "outputIndexes": [ 605 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_86_output_0", "inputIndexes": [ 604 ] , "outputIndexes": [ 606 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2466", "inputIndexes": [ 606 ] , "outputIndexes": [ 607 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2468", "inputIndexes": [ 606 ] , "outputIndexes": [ 608 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2470", "inputIndexes": [ 608, 608 ] , "outputIndexes": [ 609 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2471", "inputIndexes": [ 609 ] , "outputIndexes": [ 610 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2473", "inputIndexes": [ 609, 12 ] , "outputIndexes": [ 611 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2474", "inputIndexes": [ 611 ] , "outputIndexes": [ 612 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2477", "inputIndexes": [ 607, 610, 612, 15 ] , "outputIndexes": [ 613 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2478", "inputIndexes": [ 613 ] , "outputIndexes": [ 614 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2479", "inputIndexes": [ 61, 614 ] , "outputIndexes": [ 615 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2480", "inputIndexes": [ 615, 614 ] , "outputIndexes": [ 616 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_95_output_0", "inputIndexes": [ 606, 616, 609 ] , "outputIndexes": [ 617 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_18_output_0", "inputIndexes": [ 617, 73 ] , "outputIndexes": [ 618 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_199_output_0", "inputIndexes": [ 618, 20 ] , "outputIndexes": [ 619 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_25_output_0", "inputIndexes": [ 604, 619, 76, 77, 15 ] , "outputIndexes": [ 620 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_12_output_0", "inputIndexes": [ 620 ] , "outputIndexes": [ 621 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_198_output_0", "inputIndexes": [ 618, 20 ] , "outputIndexes": [ 622 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_24_output_0", "inputIndexes": [ 604, 20, 622, 77, 15 ] , "outputIndexes": [ 623 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_81_output_0", "inputIndexes": [ 621, 623 ] , "outputIndexes": [ 624 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_49_output_0", "inputIndexes": [ 624, 89 ] , "outputIndexes": [ 625 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_30_output_0", "inputIndexes": [ 605, 625 ] , "outputIndexes": [ 626 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/self_attn/k_proj/Linear", "inputIndexes": [ 2889 ] , "outputIndexes": [ 2894 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 24000514, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2894 ] , "outputIndexes": [ 2895 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2895 ] , "outputIndexes": [ 627 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_194_output_0", "inputIndexes": [ 593, 20 ] , "outputIndexes": [ 628 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_195_output_0", "inputIndexes": [ 601, 20 ] , "outputIndexes": [ 629 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_79_output_0", "inputIndexes": [ 628, 629, 77, 31 ] , "outputIndexes": [ 630 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_56_output_0", "inputIndexes": [ 627, 630 ] , "outputIndexes": [ 631 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_50_output_0", "inputIndexes": [ 631, 58 ] , "outputIndexes": [ 632 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_87_output_0", "inputIndexes": [ 631 ] , "outputIndexes": [ 633 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2372", "inputIndexes": [ 633 ] , "outputIndexes": [ 634 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2374", "inputIndexes": [ 633 ] , "outputIndexes": [ 635 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2376", "inputIndexes": [ 635, 635 ] , "outputIndexes": [ 636 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2377", "inputIndexes": [ 636 ] , "outputIndexes": [ 637 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2379", "inputIndexes": [ 636, 12 ] , "outputIndexes": [ 638 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2380", "inputIndexes": [ 638 ] , "outputIndexes": [ 639 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2383", "inputIndexes": [ 634, 637, 639, 15 ] , "outputIndexes": [ 640 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2384", "inputIndexes": [ 640 ] , "outputIndexes": [ 641 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2385", "inputIndexes": [ 61, 641 ] , "outputIndexes": [ 642 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2386", "inputIndexes": [ 642, 641 ] , "outputIndexes": [ 643 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_96_output_0", "inputIndexes": [ 633, 643, 636 ] , "outputIndexes": [ 644 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_19_output_0", "inputIndexes": [ 644, 73 ] , "outputIndexes": [ 645 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_201_output_0", "inputIndexes": [ 645, 20 ] , "outputIndexes": [ 646 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_27_output_0", "inputIndexes": [ 631, 646, 76, 77, 15 ] , "outputIndexes": [ 647 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_13_output_0", "inputIndexes": [ 647 ] , "outputIndexes": [ 648 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_200_output_0", "inputIndexes": [ 645, 20 ] , "outputIndexes": [ 649 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_26_output_0", "inputIndexes": [ 631, 20, 649, 77, 15 ] , "outputIndexes": [ 650 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_82_output_0", "inputIndexes": [ 648, 650 ] , "outputIndexes": [ 651 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_51_output_0", "inputIndexes": [ 651, 89 ] , "outputIndexes": [ 652 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_31_output_0", "inputIndexes": [ 632, 652 ] , "outputIndexes": [ 653 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/self_attn/v_proj/Linear", "inputIndexes": [ 2889 ] , "outputIndexes": [ 2898 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 24125192, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2898 ] , "outputIndexes": [ 2899 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2899 ] , "outputIndexes": [ 654 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_196_output_0", "inputIndexes": [ 593, 20 ] , "outputIndexes": [ 655 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_197_output_0", "inputIndexes": [ 601, 20 ] , "outputIndexes": [ 656 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_80_output_0", "inputIndexes": [ 655, 656, 77, 31 ] , "outputIndexes": [ 657 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_57_output_0", "inputIndexes": [ 654, 657 ] , "outputIndexes": [ 658 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_62_output_0", "inputIndexes": [ 626, 653, 658, 124 ] , "outputIndexes": [ 659 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 659 ] , "outputIndexes": [ 2900 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2900 ] , "outputIndexes": [ 2901 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/self_attn/o_proj/Linear", "inputIndexes": [ 2901 ] , "outputIndexes": [ 2902 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 24249870, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2902 ] , "outputIndexes": [ 2903 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2903 ] , "outputIndexes": [ 660 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_33_output_0", "inputIndexes": [ 580, 660 ] , "outputIndexes": [ 661 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_6/Mul_1_output_0", "inputIndexes": [ 661 ] , "outputIndexes": [ 662 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 24623380, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 662 ] , "outputIndexes": [ 2904 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2904 ] , "outputIndexes": [ 2905 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/mlp/gate_proj/Linear", "inputIndexes": [ 2905 ] , "outputIndexes": [ 2906 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 24627988, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2906 ] , "outputIndexes": [ 2907 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2907 ] , "outputIndexes": [ 663 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_6/Mul_output_0", "inputIndexes": [ 663 ] , "outputIndexes": [ 664 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/mlp/up_proj/Linear", "inputIndexes": [ 2905 ] , "outputIndexes": [ 2910 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 25623578, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2910 ] , "outputIndexes": [ 2911 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2911 ] , "outputIndexes": [ 665 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_6/Mul_output_0", "inputIndexes": [ 664, 665 ] , "outputIndexes": [ 666 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 666 ] , "outputIndexes": [ 2912 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2912 ] , "outputIndexes": [ 2913 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.6/mlp/down_proj/Linear", "inputIndexes": [ 2913 ] , "outputIndexes": [ 2914 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 26619168, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.6/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2914 ] , "outputIndexes": [ 2915 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2915 ] , "outputIndexes": [ 667 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_34_output_0", "inputIndexes": [ 661, 667 ] , "outputIndexes": [ 668 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_63_output_0", "inputIndexes": [ 668, 3 ] , "outputIndexes": [ 669 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_7/Mul_1_output_0", "inputIndexes": [ 669 ] , "outputIndexes": [ 670 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 27559462, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 670 ] , "outputIndexes": [ 2916 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2916 ] , "outputIndexes": [ 2917 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/self_attn/q_proj/Linear", "inputIndexes": [ 2917 ] , "outputIndexes": [ 2918 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 27564070, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2918 ] , "outputIndexes": [ 2919 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2919 ] , "outputIndexes": [ 671 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_98_output_0", "inputIndexes": [ 670 ] , "outputIndexes": [ 672 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2705", "inputIndexes": [ 672 ] , "outputIndexes": [ 673 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2707", "inputIndexes": [ 672 ] , "outputIndexes": [ 674 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2709", "inputIndexes": [ 674, 674 ] , "outputIndexes": [ 675 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2710", "inputIndexes": [ 675 ] , "outputIndexes": [ 676 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2712", "inputIndexes": [ 675, 12 ] , "outputIndexes": [ 677 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2713", "inputIndexes": [ 677 ] , "outputIndexes": [ 678 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2716", "inputIndexes": [ 673, 676, 678, 15 ] , "outputIndexes": [ 679 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2717", "inputIndexes": [ 679 ] , "outputIndexes": [ 680 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2719", "inputIndexes": [ 680, 680 ] , "outputIndexes": [ 681 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_108_output_0", "inputIndexes": [ 672, 681, 675 ] , "outputIndexes": [ 682 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_224_output_0", "inputIndexes": [ 682, 20 ] , "outputIndexes": [ 683 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2727", "inputIndexes": [ 675 ] , "outputIndexes": [ 684 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2730", "inputIndexes": [ 677 ] , "outputIndexes": [ 685 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2733", "inputIndexes": [ 673, 684, 685, 15 ] , "outputIndexes": [ 686 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2734", "inputIndexes": [ 686 ] , "outputIndexes": [ 687 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2735", "inputIndexes": [ 12, 687 ] , "outputIndexes": [ 688 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2736", "inputIndexes": [ 688, 687 ] , "outputIndexes": [ 689 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_109_output_0", "inputIndexes": [ 672, 689, 675 ] , "outputIndexes": [ 690 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_225_output_0", "inputIndexes": [ 690, 20 ] , "outputIndexes": [ 691 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_91_output_0", "inputIndexes": [ 683, 691, 30, 31 ] , "outputIndexes": [ 692 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_64_output_0", "inputIndexes": [ 671, 692 ] , "outputIndexes": [ 693 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_56_output_0", "inputIndexes": [ 693, 58 ] , "outputIndexes": [ 694 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_100_output_0", "inputIndexes": [ 693 ] , "outputIndexes": [ 695 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2837", "inputIndexes": [ 695 ] , "outputIndexes": [ 696 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2839", "inputIndexes": [ 695 ] , "outputIndexes": [ 697 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2841", "inputIndexes": [ 697, 697 ] , "outputIndexes": [ 698 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2842", "inputIndexes": [ 698 ] , "outputIndexes": [ 699 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2844", "inputIndexes": [ 698, 12 ] , "outputIndexes": [ 700 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2845", "inputIndexes": [ 700 ] , "outputIndexes": [ 701 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2848", "inputIndexes": [ 696, 699, 701, 15 ] , "outputIndexes": [ 702 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2849", "inputIndexes": [ 702 ] , "outputIndexes": [ 703 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2850", "inputIndexes": [ 61, 703 ] , "outputIndexes": [ 704 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2851", "inputIndexes": [ 704, 703 ] , "outputIndexes": [ 705 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_110_output_0", "inputIndexes": [ 695, 705, 698 ] , "outputIndexes": [ 706 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_21_output_0", "inputIndexes": [ 706, 73 ] , "outputIndexes": [ 707 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_231_output_0", "inputIndexes": [ 707, 20 ] , "outputIndexes": [ 708 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_29_output_0", "inputIndexes": [ 693, 708, 76, 77, 15 ] , "outputIndexes": [ 709 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_14_output_0", "inputIndexes": [ 709 ] , "outputIndexes": [ 710 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_230_output_0", "inputIndexes": [ 707, 20 ] , "outputIndexes": [ 711 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_28_output_0", "inputIndexes": [ 693, 20, 711, 77, 15 ] , "outputIndexes": [ 712 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_94_output_0", "inputIndexes": [ 710, 712 ] , "outputIndexes": [ 713 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_57_output_0", "inputIndexes": [ 713, 89 ] , "outputIndexes": [ 714 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_35_output_0", "inputIndexes": [ 694, 714 ] , "outputIndexes": [ 715 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/self_attn/k_proj/Linear", "inputIndexes": [ 2917 ] , "outputIndexes": [ 2922 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 27937580, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2922 ] , "outputIndexes": [ 2923 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2923 ] , "outputIndexes": [ 716 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_226_output_0", "inputIndexes": [ 682, 20 ] , "outputIndexes": [ 717 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_227_output_0", "inputIndexes": [ 690, 20 ] , "outputIndexes": [ 718 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_92_output_0", "inputIndexes": [ 717, 718, 77, 31 ] , "outputIndexes": [ 719 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_65_output_0", "inputIndexes": [ 716, 719 ] , "outputIndexes": [ 720 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_58_output_0", "inputIndexes": [ 720, 58 ] , "outputIndexes": [ 721 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_101_output_0", "inputIndexes": [ 720 ] , "outputIndexes": [ 722 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape2743", "inputIndexes": [ 722 ] , "outputIndexes": [ 723 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank2745", "inputIndexes": [ 722 ] , "outputIndexes": [ 724 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2747", "inputIndexes": [ 724, 724 ] , "outputIndexes": [ 725 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2748", "inputIndexes": [ 725 ] , "outputIndexes": [ 726 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2750", "inputIndexes": [ 725, 12 ] , "outputIndexes": [ 727 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze2751", "inputIndexes": [ 727 ] , "outputIndexes": [ 728 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice2754", "inputIndexes": [ 723, 726, 728, 15 ] , "outputIndexes": [ 729 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze2755", "inputIndexes": [ 729 ] , "outputIndexes": [ 730 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2756", "inputIndexes": [ 61, 730 ] , "outputIndexes": [ 731 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp2757", "inputIndexes": [ 731, 730 ] , "outputIndexes": [ 732 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_111_output_0", "inputIndexes": [ 722, 732, 725 ] , "outputIndexes": [ 733 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_22_output_0", "inputIndexes": [ 733, 73 ] , "outputIndexes": [ 734 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_233_output_0", "inputIndexes": [ 734, 20 ] , "outputIndexes": [ 735 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_31_output_0", "inputIndexes": [ 720, 735, 76, 77, 15 ] , "outputIndexes": [ 736 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_15_output_0", "inputIndexes": [ 736 ] , "outputIndexes": [ 737 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_232_output_0", "inputIndexes": [ 734, 20 ] , "outputIndexes": [ 738 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_30_output_0", "inputIndexes": [ 720, 20, 738, 77, 15 ] , "outputIndexes": [ 739 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_95_output_0", "inputIndexes": [ 737, 739 ] , "outputIndexes": [ 740 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_59_output_0", "inputIndexes": [ 740, 89 ] , "outputIndexes": [ 741 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_36_output_0", "inputIndexes": [ 721, 741 ] , "outputIndexes": [ 742 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/self_attn/v_proj/Linear", "inputIndexes": [ 2917 ] , "outputIndexes": [ 2926 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28062258, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2926 ] , "outputIndexes": [ 2927 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2927 ] , "outputIndexes": [ 743 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_228_output_0", "inputIndexes": [ 682, 20 ] , "outputIndexes": [ 744 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_229_output_0", "inputIndexes": [ 690, 20 ] , "outputIndexes": [ 745 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_93_output_0", "inputIndexes": [ 744, 745, 77, 31 ] , "outputIndexes": [ 746 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_66_output_0", "inputIndexes": [ 743, 746 ] , "outputIndexes": [ 747 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_71_output_0", "inputIndexes": [ 715, 742, 747, 124 ] , "outputIndexes": [ 748 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 748 ] , "outputIndexes": [ 2928 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2928 ] , "outputIndexes": [ 2929 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/self_attn/o_proj/Linear", "inputIndexes": [ 2929 ] , "outputIndexes": [ 2930 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28186936, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2930 ] , "outputIndexes": [ 2931 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2931 ] , "outputIndexes": [ 749 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_38_output_0", "inputIndexes": [ 669, 749 ] , "outputIndexes": [ 750 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_7/Mul_1_output_0", "inputIndexes": [ 750 ] , "outputIndexes": [ 751 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 28560446, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 751 ] , "outputIndexes": [ 2932 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2932 ] , "outputIndexes": [ 2933 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/mlp/gate_proj/Linear", "inputIndexes": [ 2933 ] , "outputIndexes": [ 2934 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28565054, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2934 ] , "outputIndexes": [ 2935 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2935 ] , "outputIndexes": [ 752 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_7/Mul_output_0", "inputIndexes": [ 752 ] , "outputIndexes": [ 753 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/mlp/up_proj/Linear", "inputIndexes": [ 2933 ] , "outputIndexes": [ 2938 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 29560644, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2938 ] , "outputIndexes": [ 2939 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2939 ] , "outputIndexes": [ 754 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_7/Mul_output_0", "inputIndexes": [ 753, 754 ] , "outputIndexes": [ 755 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 755 ] , "outputIndexes": [ 2940 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2940 ] , "outputIndexes": [ 2941 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.7/mlp/down_proj/Linear", "inputIndexes": [ 2941 ] , "outputIndexes": [ 2942 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 30556234, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.7/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2942 ] , "outputIndexes": [ 2943 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2943 ] , "outputIndexes": [ 756 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_39_output_0", "inputIndexes": [ 750, 756 ] , "outputIndexes": [ 757 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_72_output_0", "inputIndexes": [ 757, 3 ] , "outputIndexes": [ 758 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_8/Mul_1_output_0", "inputIndexes": [ 758 ] , "outputIndexes": [ 759 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 31496528, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 759 ] , "outputIndexes": [ 2944 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2944 ] , "outputIndexes": [ 2945 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/self_attn/q_proj/Linear", "inputIndexes": [ 2945 ] , "outputIndexes": [ 2946 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 31501136, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2946 ] , "outputIndexes": [ 2947 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2947 ] , "outputIndexes": [ 760 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_112_output_0", "inputIndexes": [ 759 ] , "outputIndexes": [ 761 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3076", "inputIndexes": [ 761 ] , "outputIndexes": [ 762 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3078", "inputIndexes": [ 761 ] , "outputIndexes": [ 763 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3080", "inputIndexes": [ 763, 763 ] , "outputIndexes": [ 764 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3081", "inputIndexes": [ 764 ] , "outputIndexes": [ 765 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3083", "inputIndexes": [ 764, 12 ] , "outputIndexes": [ 766 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3084", "inputIndexes": [ 766 ] , "outputIndexes": [ 767 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3087", "inputIndexes": [ 762, 765, 767, 15 ] , "outputIndexes": [ 768 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3088", "inputIndexes": [ 768 ] , "outputIndexes": [ 769 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3090", "inputIndexes": [ 769, 769 ] , "outputIndexes": [ 770 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_123_output_0", "inputIndexes": [ 761, 770, 764 ] , "outputIndexes": [ 771 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_256_output_0", "inputIndexes": [ 771, 20 ] , "outputIndexes": [ 772 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3098", "inputIndexes": [ 764 ] , "outputIndexes": [ 773 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3101", "inputIndexes": [ 766 ] , "outputIndexes": [ 774 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3104", "inputIndexes": [ 762, 773, 774, 15 ] , "outputIndexes": [ 775 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3105", "inputIndexes": [ 775 ] , "outputIndexes": [ 776 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3106", "inputIndexes": [ 12, 776 ] , "outputIndexes": [ 777 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3107", "inputIndexes": [ 777, 776 ] , "outputIndexes": [ 778 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_124_output_0", "inputIndexes": [ 761, 778, 764 ] , "outputIndexes": [ 779 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_257_output_0", "inputIndexes": [ 779, 20 ] , "outputIndexes": [ 780 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_104_output_0", "inputIndexes": [ 772, 780, 30, 31 ] , "outputIndexes": [ 781 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_73_output_0", "inputIndexes": [ 760, 781 ] , "outputIndexes": [ 782 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_64_output_0", "inputIndexes": [ 782, 58 ] , "outputIndexes": [ 783 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_114_output_0", "inputIndexes": [ 782 ] , "outputIndexes": [ 784 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3208", "inputIndexes": [ 784 ] , "outputIndexes": [ 785 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3210", "inputIndexes": [ 784 ] , "outputIndexes": [ 786 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3212", "inputIndexes": [ 786, 786 ] , "outputIndexes": [ 787 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3213", "inputIndexes": [ 787 ] , "outputIndexes": [ 788 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3215", "inputIndexes": [ 787, 12 ] , "outputIndexes": [ 789 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3216", "inputIndexes": [ 789 ] , "outputIndexes": [ 790 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3219", "inputIndexes": [ 785, 788, 790, 15 ] , "outputIndexes": [ 791 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3220", "inputIndexes": [ 791 ] , "outputIndexes": [ 792 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3221", "inputIndexes": [ 61, 792 ] , "outputIndexes": [ 793 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3222", "inputIndexes": [ 793, 792 ] , "outputIndexes": [ 794 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_125_output_0", "inputIndexes": [ 784, 794, 787 ] , "outputIndexes": [ 795 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_24_output_0", "inputIndexes": [ 795, 73 ] , "outputIndexes": [ 796 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_263_output_0", "inputIndexes": [ 796, 20 ] , "outputIndexes": [ 797 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_33_output_0", "inputIndexes": [ 782, 797, 76, 77, 15 ] , "outputIndexes": [ 798 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_16_output_0", "inputIndexes": [ 798 ] , "outputIndexes": [ 799 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_262_output_0", "inputIndexes": [ 796, 20 ] , "outputIndexes": [ 800 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_32_output_0", "inputIndexes": [ 782, 20, 800, 77, 15 ] , "outputIndexes": [ 801 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_107_output_0", "inputIndexes": [ 799, 801 ] , "outputIndexes": [ 802 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_65_output_0", "inputIndexes": [ 802, 89 ] , "outputIndexes": [ 803 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_40_output_0", "inputIndexes": [ 783, 803 ] , "outputIndexes": [ 804 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/self_attn/k_proj/Linear", "inputIndexes": [ 2945 ] , "outputIndexes": [ 2950 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 31874646, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2950 ] , "outputIndexes": [ 2951 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2951 ] , "outputIndexes": [ 805 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_258_output_0", "inputIndexes": [ 771, 20 ] , "outputIndexes": [ 806 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_259_output_0", "inputIndexes": [ 779, 20 ] , "outputIndexes": [ 807 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_105_output_0", "inputIndexes": [ 806, 807, 77, 31 ] , "outputIndexes": [ 808 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_74_output_0", "inputIndexes": [ 805, 808 ] , "outputIndexes": [ 809 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_66_output_0", "inputIndexes": [ 809, 58 ] , "outputIndexes": [ 810 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_115_output_0", "inputIndexes": [ 809 ] , "outputIndexes": [ 811 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3114", "inputIndexes": [ 811 ] , "outputIndexes": [ 812 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3116", "inputIndexes": [ 811 ] , "outputIndexes": [ 813 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3118", "inputIndexes": [ 813, 813 ] , "outputIndexes": [ 814 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3119", "inputIndexes": [ 814 ] , "outputIndexes": [ 815 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3121", "inputIndexes": [ 814, 12 ] , "outputIndexes": [ 816 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3122", "inputIndexes": [ 816 ] , "outputIndexes": [ 817 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3125", "inputIndexes": [ 812, 815, 817, 15 ] , "outputIndexes": [ 818 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3126", "inputIndexes": [ 818 ] , "outputIndexes": [ 819 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3127", "inputIndexes": [ 61, 819 ] , "outputIndexes": [ 820 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3128", "inputIndexes": [ 820, 819 ] , "outputIndexes": [ 821 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_126_output_0", "inputIndexes": [ 811, 821, 814 ] , "outputIndexes": [ 822 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_25_output_0", "inputIndexes": [ 822, 73 ] , "outputIndexes": [ 823 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_265_output_0", "inputIndexes": [ 823, 20 ] , "outputIndexes": [ 824 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_35_output_0", "inputIndexes": [ 809, 824, 76, 77, 15 ] , "outputIndexes": [ 825 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_17_output_0", "inputIndexes": [ 825 ] , "outputIndexes": [ 826 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_264_output_0", "inputIndexes": [ 823, 20 ] , "outputIndexes": [ 827 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_34_output_0", "inputIndexes": [ 809, 20, 827, 77, 15 ] , "outputIndexes": [ 828 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_108_output_0", "inputIndexes": [ 826, 828 ] , "outputIndexes": [ 829 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_67_output_0", "inputIndexes": [ 829, 89 ] , "outputIndexes": [ 830 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_41_output_0", "inputIndexes": [ 810, 830 ] , "outputIndexes": [ 831 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/self_attn/v_proj/Linear", "inputIndexes": [ 2945 ] , "outputIndexes": [ 2954 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 31999324, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2954 ] , "outputIndexes": [ 2955 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2955 ] , "outputIndexes": [ 832 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_260_output_0", "inputIndexes": [ 771, 20 ] , "outputIndexes": [ 833 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_261_output_0", "inputIndexes": [ 779, 20 ] , "outputIndexes": [ 834 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_106_output_0", "inputIndexes": [ 833, 834, 77, 31 ] , "outputIndexes": [ 835 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_75_output_0", "inputIndexes": [ 832, 835 ] , "outputIndexes": [ 836 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_80_output_0", "inputIndexes": [ 804, 831, 836, 124 ] , "outputIndexes": [ 837 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 837 ] , "outputIndexes": [ 2956 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2956 ] , "outputIndexes": [ 2957 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/self_attn/o_proj/Linear", "inputIndexes": [ 2957 ] , "outputIndexes": [ 2958 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 32124002, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2958 ] , "outputIndexes": [ 2959 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2959 ] , "outputIndexes": [ 838 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_43_output_0", "inputIndexes": [ 758, 838 ] , "outputIndexes": [ 839 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_8/Mul_1_output_0", "inputIndexes": [ 839 ] , "outputIndexes": [ 840 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 32497512, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 840 ] , "outputIndexes": [ 2960 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2960 ] , "outputIndexes": [ 2961 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/mlp/gate_proj/Linear", "inputIndexes": [ 2961 ] , "outputIndexes": [ 2962 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 32502120, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2962 ] , "outputIndexes": [ 2963 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2963 ] , "outputIndexes": [ 841 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_8/Mul_output_0", "inputIndexes": [ 841 ] , "outputIndexes": [ 842 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/mlp/up_proj/Linear", "inputIndexes": [ 2961 ] , "outputIndexes": [ 2966 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 33497710, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2966 ] , "outputIndexes": [ 2967 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2967 ] , "outputIndexes": [ 843 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_8/Mul_output_0", "inputIndexes": [ 842, 843 ] , "outputIndexes": [ 844 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 844 ] , "outputIndexes": [ 2968 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2968 ] , "outputIndexes": [ 2969 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.8/mlp/down_proj/Linear", "inputIndexes": [ 2969 ] , "outputIndexes": [ 2970 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 34493300, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.8/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2970 ] , "outputIndexes": [ 2971 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2971 ] , "outputIndexes": [ 845 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_44_output_0", "inputIndexes": [ 839, 845 ] , "outputIndexes": [ 846 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_81_output_0", "inputIndexes": [ 846, 3 ] , "outputIndexes": [ 847 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_9/Mul_1_output_0", "inputIndexes": [ 847 ] , "outputIndexes": [ 848 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 35433594, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 848 ] , "outputIndexes": [ 2972 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 2972 ] , "outputIndexes": [ 2973 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/self_attn/q_proj/Linear", "inputIndexes": [ 2973 ] , "outputIndexes": [ 2974 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 35438202, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 2974 ] , "outputIndexes": [ 2975 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 2975 ] , "outputIndexes": [ 849 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_126_output_0", "inputIndexes": [ 848 ] , "outputIndexes": [ 850 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3447", "inputIndexes": [ 850 ] , "outputIndexes": [ 851 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3449", "inputIndexes": [ 850 ] , "outputIndexes": [ 852 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3451", "inputIndexes": [ 852, 852 ] , "outputIndexes": [ 853 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3452", "inputIndexes": [ 853 ] , "outputIndexes": [ 854 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3454", "inputIndexes": [ 853, 12 ] , "outputIndexes": [ 855 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3455", "inputIndexes": [ 855 ] , "outputIndexes": [ 856 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3458", "inputIndexes": [ 851, 854, 856, 15 ] , "outputIndexes": [ 857 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3459", "inputIndexes": [ 857 ] , "outputIndexes": [ 858 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3461", "inputIndexes": [ 858, 858 ] , "outputIndexes": [ 859 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_138_output_0", "inputIndexes": [ 850, 859, 853 ] , "outputIndexes": [ 860 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_288_output_0", "inputIndexes": [ 860, 20 ] , "outputIndexes": [ 861 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3469", "inputIndexes": [ 853 ] , "outputIndexes": [ 862 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3472", "inputIndexes": [ 855 ] , "outputIndexes": [ 863 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3475", "inputIndexes": [ 851, 862, 863, 15 ] , "outputIndexes": [ 864 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3476", "inputIndexes": [ 864 ] , "outputIndexes": [ 865 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3477", "inputIndexes": [ 12, 865 ] , "outputIndexes": [ 866 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3478", "inputIndexes": [ 866, 865 ] , "outputIndexes": [ 867 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_139_output_0", "inputIndexes": [ 850, 867, 853 ] , "outputIndexes": [ 868 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_289_output_0", "inputIndexes": [ 868, 20 ] , "outputIndexes": [ 869 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_117_output_0", "inputIndexes": [ 861, 869, 30, 31 ] , "outputIndexes": [ 870 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_82_output_0", "inputIndexes": [ 849, 870 ] , "outputIndexes": [ 871 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_72_output_0", "inputIndexes": [ 871, 58 ] , "outputIndexes": [ 872 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_128_output_0", "inputIndexes": [ 871 ] , "outputIndexes": [ 873 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3579", "inputIndexes": [ 873 ] , "outputIndexes": [ 874 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3581", "inputIndexes": [ 873 ] , "outputIndexes": [ 875 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3583", "inputIndexes": [ 875, 875 ] , "outputIndexes": [ 876 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3584", "inputIndexes": [ 876 ] , "outputIndexes": [ 877 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3586", "inputIndexes": [ 876, 12 ] , "outputIndexes": [ 878 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3587", "inputIndexes": [ 878 ] , "outputIndexes": [ 879 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3590", "inputIndexes": [ 874, 877, 879, 15 ] , "outputIndexes": [ 880 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3591", "inputIndexes": [ 880 ] , "outputIndexes": [ 881 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3592", "inputIndexes": [ 61, 881 ] , "outputIndexes": [ 882 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3593", "inputIndexes": [ 882, 881 ] , "outputIndexes": [ 883 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_140_output_0", "inputIndexes": [ 873, 883, 876 ] , "outputIndexes": [ 884 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_27_output_0", "inputIndexes": [ 884, 73 ] , "outputIndexes": [ 885 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_295_output_0", "inputIndexes": [ 885, 20 ] , "outputIndexes": [ 886 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_37_output_0", "inputIndexes": [ 871, 886, 76, 77, 15 ] , "outputIndexes": [ 887 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_18_output_0", "inputIndexes": [ 887 ] , "outputIndexes": [ 888 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_294_output_0", "inputIndexes": [ 885, 20 ] , "outputIndexes": [ 889 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_36_output_0", "inputIndexes": [ 871, 20, 889, 77, 15 ] , "outputIndexes": [ 890 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_120_output_0", "inputIndexes": [ 888, 890 ] , "outputIndexes": [ 891 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_73_output_0", "inputIndexes": [ 891, 89 ] , "outputIndexes": [ 892 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_45_output_0", "inputIndexes": [ 872, 892 ] , "outputIndexes": [ 893 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/self_attn/k_proj/Linear", "inputIndexes": [ 2973 ] , "outputIndexes": [ 2978 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 35811712, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 2978 ] , "outputIndexes": [ 2979 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 2979 ] , "outputIndexes": [ 894 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_290_output_0", "inputIndexes": [ 860, 20 ] , "outputIndexes": [ 895 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_291_output_0", "inputIndexes": [ 868, 20 ] , "outputIndexes": [ 896 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_118_output_0", "inputIndexes": [ 895, 896, 77, 31 ] , "outputIndexes": [ 897 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_83_output_0", "inputIndexes": [ 894, 897 ] , "outputIndexes": [ 898 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_74_output_0", "inputIndexes": [ 898, 58 ] , "outputIndexes": [ 899 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_129_output_0", "inputIndexes": [ 898 ] , "outputIndexes": [ 900 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3485", "inputIndexes": [ 900 ] , "outputIndexes": [ 901 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3487", "inputIndexes": [ 900 ] , "outputIndexes": [ 902 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3489", "inputIndexes": [ 902, 902 ] , "outputIndexes": [ 903 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3490", "inputIndexes": [ 903 ] , "outputIndexes": [ 904 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3492", "inputIndexes": [ 903, 12 ] , "outputIndexes": [ 905 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3493", "inputIndexes": [ 905 ] , "outputIndexes": [ 906 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3496", "inputIndexes": [ 901, 904, 906, 15 ] , "outputIndexes": [ 907 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3497", "inputIndexes": [ 907 ] , "outputIndexes": [ 908 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3498", "inputIndexes": [ 61, 908 ] , "outputIndexes": [ 909 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3499", "inputIndexes": [ 909, 908 ] , "outputIndexes": [ 910 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_141_output_0", "inputIndexes": [ 900, 910, 903 ] , "outputIndexes": [ 911 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_28_output_0", "inputIndexes": [ 911, 73 ] , "outputIndexes": [ 912 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_297_output_0", "inputIndexes": [ 912, 20 ] , "outputIndexes": [ 913 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_39_output_0", "inputIndexes": [ 898, 913, 76, 77, 15 ] , "outputIndexes": [ 914 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_19_output_0", "inputIndexes": [ 914 ] , "outputIndexes": [ 915 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_296_output_0", "inputIndexes": [ 912, 20 ] , "outputIndexes": [ 916 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_38_output_0", "inputIndexes": [ 898, 20, 916, 77, 15 ] , "outputIndexes": [ 917 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_121_output_0", "inputIndexes": [ 915, 917 ] , "outputIndexes": [ 918 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_75_output_0", "inputIndexes": [ 918, 89 ] , "outputIndexes": [ 919 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_46_output_0", "inputIndexes": [ 899, 919 ] , "outputIndexes": [ 920 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/self_attn/v_proj/Linear", "inputIndexes": [ 2973 ] , "outputIndexes": [ 2982 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 35936390, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 2982 ] , "outputIndexes": [ 2983 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 2983 ] , "outputIndexes": [ 921 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_292_output_0", "inputIndexes": [ 860, 20 ] , "outputIndexes": [ 922 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_293_output_0", "inputIndexes": [ 868, 20 ] , "outputIndexes": [ 923 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_119_output_0", "inputIndexes": [ 922, 923, 77, 31 ] , "outputIndexes": [ 924 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_84_output_0", "inputIndexes": [ 921, 924 ] , "outputIndexes": [ 925 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_89_output_0", "inputIndexes": [ 893, 920, 925, 124 ] , "outputIndexes": [ 926 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 926 ] , "outputIndexes": [ 2984 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 2984 ] , "outputIndexes": [ 2985 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/self_attn/o_proj/Linear", "inputIndexes": [ 2985 ] , "outputIndexes": [ 2986 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 36061068, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 2986 ] , "outputIndexes": [ 2987 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 2987 ] , "outputIndexes": [ 927 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_48_output_0", "inputIndexes": [ 847, 927 ] , "outputIndexes": [ 928 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_9/Mul_1_output_0", "inputIndexes": [ 928 ] , "outputIndexes": [ 929 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 36434578, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 929 ] , "outputIndexes": [ 2988 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 2988 ] , "outputIndexes": [ 2989 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/mlp/gate_proj/Linear", "inputIndexes": [ 2989 ] , "outputIndexes": [ 2990 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 36439186, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 2990 ] , "outputIndexes": [ 2991 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 2991 ] , "outputIndexes": [ 930 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_9/Mul_output_0", "inputIndexes": [ 930 ] , "outputIndexes": [ 931 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/mlp/up_proj/Linear", "inputIndexes": [ 2989 ] , "outputIndexes": [ 2994 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 37434776, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 2994 ] , "outputIndexes": [ 2995 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 2995 ] , "outputIndexes": [ 932 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_9/Mul_output_0", "inputIndexes": [ 931, 932 ] , "outputIndexes": [ 933 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 933 ] , "outputIndexes": [ 2996 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 2996 ] , "outputIndexes": [ 2997 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.9/mlp/down_proj/Linear", "inputIndexes": [ 2997 ] , "outputIndexes": [ 2998 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 38430366, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.9/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 2998 ] , "outputIndexes": [ 2999 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 2999 ] , "outputIndexes": [ 934 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_49_output_0", "inputIndexes": [ 928, 934 ] , "outputIndexes": [ 935 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_90_output_0", "inputIndexes": [ 935, 3 ] , "outputIndexes": [ 936 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_10/Mul_1_output_0", "inputIndexes": [ 936 ] , "outputIndexes": [ 937 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 39370660, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 937 ] , "outputIndexes": [ 3000 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3000 ] , "outputIndexes": [ 3001 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/self_attn/q_proj/Linear", "inputIndexes": [ 3001 ] , "outputIndexes": [ 3002 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 39375268, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3002 ] , "outputIndexes": [ 3003 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3003 ] , "outputIndexes": [ 938 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_140_output_0", "inputIndexes": [ 937 ] , "outputIndexes": [ 939 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3818", "inputIndexes": [ 939 ] , "outputIndexes": [ 940 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3820", "inputIndexes": [ 939 ] , "outputIndexes": [ 941 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3822", "inputIndexes": [ 941, 941 ] , "outputIndexes": [ 942 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3823", "inputIndexes": [ 942 ] , "outputIndexes": [ 943 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3825", "inputIndexes": [ 942, 12 ] , "outputIndexes": [ 944 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3826", "inputIndexes": [ 944 ] , "outputIndexes": [ 945 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3829", "inputIndexes": [ 940, 943, 945, 15 ] , "outputIndexes": [ 946 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3830", "inputIndexes": [ 946 ] , "outputIndexes": [ 947 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3832", "inputIndexes": [ 947, 947 ] , "outputIndexes": [ 948 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_153_output_0", "inputIndexes": [ 939, 948, 942 ] , "outputIndexes": [ 949 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_320_output_0", "inputIndexes": [ 949, 20 ] , "outputIndexes": [ 950 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3840", "inputIndexes": [ 942 ] , "outputIndexes": [ 951 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3843", "inputIndexes": [ 944 ] , "outputIndexes": [ 952 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3846", "inputIndexes": [ 940, 951, 952, 15 ] , "outputIndexes": [ 953 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3847", "inputIndexes": [ 953 ] , "outputIndexes": [ 954 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3848", "inputIndexes": [ 12, 954 ] , "outputIndexes": [ 955 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3849", "inputIndexes": [ 955, 954 ] , "outputIndexes": [ 956 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_154_output_0", "inputIndexes": [ 939, 956, 942 ] , "outputIndexes": [ 957 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_321_output_0", "inputIndexes": [ 957, 20 ] , "outputIndexes": [ 958 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_130_output_0", "inputIndexes": [ 950, 958, 30, 31 ] , "outputIndexes": [ 959 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_91_output_0", "inputIndexes": [ 938, 959 ] , "outputIndexes": [ 960 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_80_output_0", "inputIndexes": [ 960, 58 ] , "outputIndexes": [ 961 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_142_output_0", "inputIndexes": [ 960 ] , "outputIndexes": [ 962 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3950", "inputIndexes": [ 962 ] , "outputIndexes": [ 963 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3952", "inputIndexes": [ 962 ] , "outputIndexes": [ 964 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3954", "inputIndexes": [ 964, 964 ] , "outputIndexes": [ 965 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3955", "inputIndexes": [ 965 ] , "outputIndexes": [ 966 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3957", "inputIndexes": [ 965, 12 ] , "outputIndexes": [ 967 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3958", "inputIndexes": [ 967 ] , "outputIndexes": [ 968 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3961", "inputIndexes": [ 963, 966, 968, 15 ] , "outputIndexes": [ 969 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3962", "inputIndexes": [ 969 ] , "outputIndexes": [ 970 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3963", "inputIndexes": [ 61, 970 ] , "outputIndexes": [ 971 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3964", "inputIndexes": [ 971, 970 ] , "outputIndexes": [ 972 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_155_output_0", "inputIndexes": [ 962, 972, 965 ] , "outputIndexes": [ 973 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_30_output_0", "inputIndexes": [ 973, 73 ] , "outputIndexes": [ 974 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_327_output_0", "inputIndexes": [ 974, 20 ] , "outputIndexes": [ 975 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_41_output_0", "inputIndexes": [ 960, 975, 76, 77, 15 ] , "outputIndexes": [ 976 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_20_output_0", "inputIndexes": [ 976 ] , "outputIndexes": [ 977 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_326_output_0", "inputIndexes": [ 974, 20 ] , "outputIndexes": [ 978 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_40_output_0", "inputIndexes": [ 960, 20, 978, 77, 15 ] , "outputIndexes": [ 979 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_133_output_0", "inputIndexes": [ 977, 979 ] , "outputIndexes": [ 980 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_81_output_0", "inputIndexes": [ 980, 89 ] , "outputIndexes": [ 981 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_50_output_0", "inputIndexes": [ 961, 981 ] , "outputIndexes": [ 982 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/self_attn/k_proj/Linear", "inputIndexes": [ 3001 ] , "outputIndexes": [ 3006 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 39748778, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3006 ] , "outputIndexes": [ 3007 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3007 ] , "outputIndexes": [ 983 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_322_output_0", "inputIndexes": [ 949, 20 ] , "outputIndexes": [ 984 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_323_output_0", "inputIndexes": [ 957, 20 ] , "outputIndexes": [ 985 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_131_output_0", "inputIndexes": [ 984, 985, 77, 31 ] , "outputIndexes": [ 986 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_92_output_0", "inputIndexes": [ 983, 986 ] , "outputIndexes": [ 987 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_82_output_0", "inputIndexes": [ 987, 58 ] , "outputIndexes": [ 988 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_143_output_0", "inputIndexes": [ 987 ] , "outputIndexes": [ 989 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape3856", "inputIndexes": [ 989 ] , "outputIndexes": [ 990 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank3858", "inputIndexes": [ 989 ] , "outputIndexes": [ 991 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3860", "inputIndexes": [ 991, 991 ] , "outputIndexes": [ 992 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3861", "inputIndexes": [ 992 ] , "outputIndexes": [ 993 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3863", "inputIndexes": [ 992, 12 ] , "outputIndexes": [ 994 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze3864", "inputIndexes": [ 994 ] , "outputIndexes": [ 995 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice3867", "inputIndexes": [ 990, 993, 995, 15 ] , "outputIndexes": [ 996 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze3868", "inputIndexes": [ 996 ] , "outputIndexes": [ 997 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3869", "inputIndexes": [ 61, 997 ] , "outputIndexes": [ 998 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp3870", "inputIndexes": [ 998, 997 ] , "outputIndexes": [ 999 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_156_output_0", "inputIndexes": [ 989, 999, 992 ] , "outputIndexes": [ 1000 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_31_output_0", "inputIndexes": [ 1000, 73 ] , "outputIndexes": [ 1001 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_329_output_0", "inputIndexes": [ 1001, 20 ] , "outputIndexes": [ 1002 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_43_output_0", "inputIndexes": [ 987, 1002, 76, 77, 15 ] , "outputIndexes": [ 1003 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_21_output_0", "inputIndexes": [ 1003 ] , "outputIndexes": [ 1004 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_328_output_0", "inputIndexes": [ 1001, 20 ] , "outputIndexes": [ 1005 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_42_output_0", "inputIndexes": [ 987, 20, 1005, 77, 15 ] , "outputIndexes": [ 1006 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_134_output_0", "inputIndexes": [ 1004, 1006 ] , "outputIndexes": [ 1007 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_83_output_0", "inputIndexes": [ 1007, 89 ] , "outputIndexes": [ 1008 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_51_output_0", "inputIndexes": [ 988, 1008 ] , "outputIndexes": [ 1009 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/self_attn/v_proj/Linear", "inputIndexes": [ 3001 ] , "outputIndexes": [ 3010 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 39873456, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3010 ] , "outputIndexes": [ 3011 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3011 ] , "outputIndexes": [ 1010 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_324_output_0", "inputIndexes": [ 949, 20 ] , "outputIndexes": [ 1011 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_325_output_0", "inputIndexes": [ 957, 20 ] , "outputIndexes": [ 1012 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_132_output_0", "inputIndexes": [ 1011, 1012, 77, 31 ] , "outputIndexes": [ 1013 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_93_output_0", "inputIndexes": [ 1010, 1013 ] , "outputIndexes": [ 1014 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_98_output_0", "inputIndexes": [ 982, 1009, 1014, 124 ] , "outputIndexes": [ 1015 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1015 ] , "outputIndexes": [ 3012 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3012 ] , "outputIndexes": [ 3013 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/self_attn/o_proj/Linear", "inputIndexes": [ 3013 ] , "outputIndexes": [ 3014 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 39998134, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3014 ] , "outputIndexes": [ 3015 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3015 ] , "outputIndexes": [ 1016 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_53_output_0", "inputIndexes": [ 936, 1016 ] , "outputIndexes": [ 1017 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_10/Mul_1_output_0", "inputIndexes": [ 1017 ] , "outputIndexes": [ 1018 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 40371644, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1018 ] , "outputIndexes": [ 3016 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3016 ] , "outputIndexes": [ 3017 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/mlp/gate_proj/Linear", "inputIndexes": [ 3017 ] , "outputIndexes": [ 3018 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 40376252, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3018 ] , "outputIndexes": [ 3019 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3019 ] , "outputIndexes": [ 1019 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_10/Mul_output_0", "inputIndexes": [ 1019 ] , "outputIndexes": [ 1020 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/mlp/up_proj/Linear", "inputIndexes": [ 3017 ] , "outputIndexes": [ 3022 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 41371842, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3022 ] , "outputIndexes": [ 3023 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3023 ] , "outputIndexes": [ 1021 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_10/Mul_output_0", "inputIndexes": [ 1020, 1021 ] , "outputIndexes": [ 1022 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1022 ] , "outputIndexes": [ 3024 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3024 ] , "outputIndexes": [ 3025 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.10/mlp/down_proj/Linear", "inputIndexes": [ 3025 ] , "outputIndexes": [ 3026 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 42367432, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.10/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3026 ] , "outputIndexes": [ 3027 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3027 ] , "outputIndexes": [ 1023 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_54_output_0", "inputIndexes": [ 1017, 1023 ] , "outputIndexes": [ 1024 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_99_output_0", "inputIndexes": [ 1024, 3 ] , "outputIndexes": [ 1025 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_11/Mul_1_output_0", "inputIndexes": [ 1025 ] , "outputIndexes": [ 1026 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 43307726, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1026 ] , "outputIndexes": [ 3028 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3028 ] , "outputIndexes": [ 3029 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/self_attn/q_proj/Linear", "inputIndexes": [ 3029 ] , "outputIndexes": [ 3030 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 43312334, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3030 ] , "outputIndexes": [ 3031 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3031 ] , "outputIndexes": [ 1027 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_154_output_0", "inputIndexes": [ 1026 ] , "outputIndexes": [ 1028 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4189", "inputIndexes": [ 1028 ] , "outputIndexes": [ 1029 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4191", "inputIndexes": [ 1028 ] , "outputIndexes": [ 1030 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4193", "inputIndexes": [ 1030, 1030 ] , "outputIndexes": [ 1031 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4194", "inputIndexes": [ 1031 ] , "outputIndexes": [ 1032 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4196", "inputIndexes": [ 1031, 12 ] , "outputIndexes": [ 1033 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4197", "inputIndexes": [ 1033 ] , "outputIndexes": [ 1034 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4200", "inputIndexes": [ 1029, 1032, 1034, 15 ] , "outputIndexes": [ 1035 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4201", "inputIndexes": [ 1035 ] , "outputIndexes": [ 1036 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4203", "inputIndexes": [ 1036, 1036 ] , "outputIndexes": [ 1037 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_168_output_0", "inputIndexes": [ 1028, 1037, 1031 ] , "outputIndexes": [ 1038 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_352_output_0", "inputIndexes": [ 1038, 20 ] , "outputIndexes": [ 1039 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4211", "inputIndexes": [ 1031 ] , "outputIndexes": [ 1040 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4214", "inputIndexes": [ 1033 ] , "outputIndexes": [ 1041 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4217", "inputIndexes": [ 1029, 1040, 1041, 15 ] , "outputIndexes": [ 1042 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4218", "inputIndexes": [ 1042 ] , "outputIndexes": [ 1043 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4219", "inputIndexes": [ 12, 1043 ] , "outputIndexes": [ 1044 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4220", "inputIndexes": [ 1044, 1043 ] , "outputIndexes": [ 1045 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_169_output_0", "inputIndexes": [ 1028, 1045, 1031 ] , "outputIndexes": [ 1046 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_353_output_0", "inputIndexes": [ 1046, 20 ] , "outputIndexes": [ 1047 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_143_output_0", "inputIndexes": [ 1039, 1047, 30, 31 ] , "outputIndexes": [ 1048 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_100_output_0", "inputIndexes": [ 1027, 1048 ] , "outputIndexes": [ 1049 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_88_output_0", "inputIndexes": [ 1049, 58 ] , "outputIndexes": [ 1050 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_156_output_0", "inputIndexes": [ 1049 ] , "outputIndexes": [ 1051 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4321", "inputIndexes": [ 1051 ] , "outputIndexes": [ 1052 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4323", "inputIndexes": [ 1051 ] , "outputIndexes": [ 1053 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4325", "inputIndexes": [ 1053, 1053 ] , "outputIndexes": [ 1054 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4326", "inputIndexes": [ 1054 ] , "outputIndexes": [ 1055 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4328", "inputIndexes": [ 1054, 12 ] , "outputIndexes": [ 1056 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4329", "inputIndexes": [ 1056 ] , "outputIndexes": [ 1057 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4332", "inputIndexes": [ 1052, 1055, 1057, 15 ] , "outputIndexes": [ 1058 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4333", "inputIndexes": [ 1058 ] , "outputIndexes": [ 1059 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4334", "inputIndexes": [ 61, 1059 ] , "outputIndexes": [ 1060 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4335", "inputIndexes": [ 1060, 1059 ] , "outputIndexes": [ 1061 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_170_output_0", "inputIndexes": [ 1051, 1061, 1054 ] , "outputIndexes": [ 1062 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_33_output_0", "inputIndexes": [ 1062, 73 ] , "outputIndexes": [ 1063 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_359_output_0", "inputIndexes": [ 1063, 20 ] , "outputIndexes": [ 1064 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_45_output_0", "inputIndexes": [ 1049, 1064, 76, 77, 15 ] , "outputIndexes": [ 1065 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_22_output_0", "inputIndexes": [ 1065 ] , "outputIndexes": [ 1066 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_358_output_0", "inputIndexes": [ 1063, 20 ] , "outputIndexes": [ 1067 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_44_output_0", "inputIndexes": [ 1049, 20, 1067, 77, 15 ] , "outputIndexes": [ 1068 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_146_output_0", "inputIndexes": [ 1066, 1068 ] , "outputIndexes": [ 1069 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_89_output_0", "inputIndexes": [ 1069, 89 ] , "outputIndexes": [ 1070 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_55_output_0", "inputIndexes": [ 1050, 1070 ] , "outputIndexes": [ 1071 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/self_attn/k_proj/Linear", "inputIndexes": [ 3029 ] , "outputIndexes": [ 3034 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 43685844, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3034 ] , "outputIndexes": [ 3035 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3035 ] , "outputIndexes": [ 1072 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_354_output_0", "inputIndexes": [ 1038, 20 ] , "outputIndexes": [ 1073 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_355_output_0", "inputIndexes": [ 1046, 20 ] , "outputIndexes": [ 1074 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_144_output_0", "inputIndexes": [ 1073, 1074, 77, 31 ] , "outputIndexes": [ 1075 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_101_output_0", "inputIndexes": [ 1072, 1075 ] , "outputIndexes": [ 1076 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_90_output_0", "inputIndexes": [ 1076, 58 ] , "outputIndexes": [ 1077 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_157_output_0", "inputIndexes": [ 1076 ] , "outputIndexes": [ 1078 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4227", "inputIndexes": [ 1078 ] , "outputIndexes": [ 1079 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4229", "inputIndexes": [ 1078 ] , "outputIndexes": [ 1080 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4231", "inputIndexes": [ 1080, 1080 ] , "outputIndexes": [ 1081 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4232", "inputIndexes": [ 1081 ] , "outputIndexes": [ 1082 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4234", "inputIndexes": [ 1081, 12 ] , "outputIndexes": [ 1083 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4235", "inputIndexes": [ 1083 ] , "outputIndexes": [ 1084 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4238", "inputIndexes": [ 1079, 1082, 1084, 15 ] , "outputIndexes": [ 1085 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4239", "inputIndexes": [ 1085 ] , "outputIndexes": [ 1086 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4240", "inputIndexes": [ 61, 1086 ] , "outputIndexes": [ 1087 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4241", "inputIndexes": [ 1087, 1086 ] , "outputIndexes": [ 1088 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_171_output_0", "inputIndexes": [ 1078, 1088, 1081 ] , "outputIndexes": [ 1089 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_34_output_0", "inputIndexes": [ 1089, 73 ] , "outputIndexes": [ 1090 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_361_output_0", "inputIndexes": [ 1090, 20 ] , "outputIndexes": [ 1091 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_47_output_0", "inputIndexes": [ 1076, 1091, 76, 77, 15 ] , "outputIndexes": [ 1092 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_23_output_0", "inputIndexes": [ 1092 ] , "outputIndexes": [ 1093 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_360_output_0", "inputIndexes": [ 1090, 20 ] , "outputIndexes": [ 1094 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_46_output_0", "inputIndexes": [ 1076, 20, 1094, 77, 15 ] , "outputIndexes": [ 1095 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_147_output_0", "inputIndexes": [ 1093, 1095 ] , "outputIndexes": [ 1096 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_91_output_0", "inputIndexes": [ 1096, 89 ] , "outputIndexes": [ 1097 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_56_output_0", "inputIndexes": [ 1077, 1097 ] , "outputIndexes": [ 1098 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/self_attn/v_proj/Linear", "inputIndexes": [ 3029 ] , "outputIndexes": [ 3038 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 43810522, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3038 ] , "outputIndexes": [ 3039 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3039 ] , "outputIndexes": [ 1099 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_356_output_0", "inputIndexes": [ 1038, 20 ] , "outputIndexes": [ 1100 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_357_output_0", "inputIndexes": [ 1046, 20 ] , "outputIndexes": [ 1101 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_145_output_0", "inputIndexes": [ 1100, 1101, 77, 31 ] , "outputIndexes": [ 1102 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_102_output_0", "inputIndexes": [ 1099, 1102 ] , "outputIndexes": [ 1103 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_107_output_0", "inputIndexes": [ 1071, 1098, 1103, 124 ] , "outputIndexes": [ 1104 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1104 ] , "outputIndexes": [ 3040 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3040 ] , "outputIndexes": [ 3041 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/self_attn/o_proj/Linear", "inputIndexes": [ 3041 ] , "outputIndexes": [ 3042 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 43935200, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3042 ] , "outputIndexes": [ 3043 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3043 ] , "outputIndexes": [ 1105 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_58_output_0", "inputIndexes": [ 1025, 1105 ] , "outputIndexes": [ 1106 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_11/Mul_1_output_0", "inputIndexes": [ 1106 ] , "outputIndexes": [ 1107 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 44308710, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1107 ] , "outputIndexes": [ 3044 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3044 ] , "outputIndexes": [ 3045 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/mlp/gate_proj/Linear", "inputIndexes": [ 3045 ] , "outputIndexes": [ 3046 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 44313318, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3046 ] , "outputIndexes": [ 3047 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3047 ] , "outputIndexes": [ 1108 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_11/Mul_output_0", "inputIndexes": [ 1108 ] , "outputIndexes": [ 1109 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/mlp/up_proj/Linear", "inputIndexes": [ 3045 ] , "outputIndexes": [ 3050 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 45308908, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3050 ] , "outputIndexes": [ 3051 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3051 ] , "outputIndexes": [ 1110 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_11/Mul_output_0", "inputIndexes": [ 1109, 1110 ] , "outputIndexes": [ 1111 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1111 ] , "outputIndexes": [ 3052 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3052 ] , "outputIndexes": [ 3053 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.11/mlp/down_proj/Linear", "inputIndexes": [ 3053 ] , "outputIndexes": [ 3054 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 46304498, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.11/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3054 ] , "outputIndexes": [ 3055 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3055 ] , "outputIndexes": [ 1112 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_59_output_0", "inputIndexes": [ 1106, 1112 ] , "outputIndexes": [ 1113 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_108_output_0", "inputIndexes": [ 1113, 3 ] , "outputIndexes": [ 1114 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_12/Mul_1_output_0", "inputIndexes": [ 1114 ] , "outputIndexes": [ 1115 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 47244792, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1115 ] , "outputIndexes": [ 3056 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3056 ] , "outputIndexes": [ 3057 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/self_attn/q_proj/Linear", "inputIndexes": [ 3057 ] , "outputIndexes": [ 3058 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47249400, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3058 ] , "outputIndexes": [ 3059 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3059 ] , "outputIndexes": [ 1116 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_168_output_0", "inputIndexes": [ 1115 ] , "outputIndexes": [ 1117 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4560", "inputIndexes": [ 1117 ] , "outputIndexes": [ 1118 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4562", "inputIndexes": [ 1117 ] , "outputIndexes": [ 1119 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4564", "inputIndexes": [ 1119, 1119 ] , "outputIndexes": [ 1120 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4565", "inputIndexes": [ 1120 ] , "outputIndexes": [ 1121 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4567", "inputIndexes": [ 1120, 12 ] , "outputIndexes": [ 1122 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4568", "inputIndexes": [ 1122 ] , "outputIndexes": [ 1123 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4571", "inputIndexes": [ 1118, 1121, 1123, 15 ] , "outputIndexes": [ 1124 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4572", "inputIndexes": [ 1124 ] , "outputIndexes": [ 1125 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4574", "inputIndexes": [ 1125, 1125 ] , "outputIndexes": [ 1126 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_183_output_0", "inputIndexes": [ 1117, 1126, 1120 ] , "outputIndexes": [ 1127 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_384_output_0", "inputIndexes": [ 1127, 20 ] , "outputIndexes": [ 1128 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4582", "inputIndexes": [ 1120 ] , "outputIndexes": [ 1129 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4585", "inputIndexes": [ 1122 ] , "outputIndexes": [ 1130 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4588", "inputIndexes": [ 1118, 1129, 1130, 15 ] , "outputIndexes": [ 1131 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4589", "inputIndexes": [ 1131 ] , "outputIndexes": [ 1132 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4590", "inputIndexes": [ 12, 1132 ] , "outputIndexes": [ 1133 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4591", "inputIndexes": [ 1133, 1132 ] , "outputIndexes": [ 1134 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_184_output_0", "inputIndexes": [ 1117, 1134, 1120 ] , "outputIndexes": [ 1135 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_385_output_0", "inputIndexes": [ 1135, 20 ] , "outputIndexes": [ 1136 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_156_output_0", "inputIndexes": [ 1128, 1136, 30, 31 ] , "outputIndexes": [ 1137 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_109_output_0", "inputIndexes": [ 1116, 1137 ] , "outputIndexes": [ 1138 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_96_output_0", "inputIndexes": [ 1138, 58 ] , "outputIndexes": [ 1139 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_170_output_0", "inputIndexes": [ 1138 ] , "outputIndexes": [ 1140 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4692", "inputIndexes": [ 1140 ] , "outputIndexes": [ 1141 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4694", "inputIndexes": [ 1140 ] , "outputIndexes": [ 1142 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4696", "inputIndexes": [ 1142, 1142 ] , "outputIndexes": [ 1143 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4697", "inputIndexes": [ 1143 ] , "outputIndexes": [ 1144 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4699", "inputIndexes": [ 1143, 12 ] , "outputIndexes": [ 1145 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4700", "inputIndexes": [ 1145 ] , "outputIndexes": [ 1146 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4703", "inputIndexes": [ 1141, 1144, 1146, 15 ] , "outputIndexes": [ 1147 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4704", "inputIndexes": [ 1147 ] , "outputIndexes": [ 1148 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4705", "inputIndexes": [ 61, 1148 ] , "outputIndexes": [ 1149 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4706", "inputIndexes": [ 1149, 1148 ] , "outputIndexes": [ 1150 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_185_output_0", "inputIndexes": [ 1140, 1150, 1143 ] , "outputIndexes": [ 1151 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_36_output_0", "inputIndexes": [ 1151, 73 ] , "outputIndexes": [ 1152 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_391_output_0", "inputIndexes": [ 1152, 20 ] , "outputIndexes": [ 1153 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_49_output_0", "inputIndexes": [ 1138, 1153, 76, 77, 15 ] , "outputIndexes": [ 1154 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_24_output_0", "inputIndexes": [ 1154 ] , "outputIndexes": [ 1155 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_390_output_0", "inputIndexes": [ 1152, 20 ] , "outputIndexes": [ 1156 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_48_output_0", "inputIndexes": [ 1138, 20, 1156, 77, 15 ] , "outputIndexes": [ 1157 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_159_output_0", "inputIndexes": [ 1155, 1157 ] , "outputIndexes": [ 1158 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_97_output_0", "inputIndexes": [ 1158, 89 ] , "outputIndexes": [ 1159 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_60_output_0", "inputIndexes": [ 1139, 1159 ] , "outputIndexes": [ 1160 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/self_attn/k_proj/Linear", "inputIndexes": [ 3057 ] , "outputIndexes": [ 3062 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47622910, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3062 ] , "outputIndexes": [ 3063 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3063 ] , "outputIndexes": [ 1161 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_386_output_0", "inputIndexes": [ 1127, 20 ] , "outputIndexes": [ 1162 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_387_output_0", "inputIndexes": [ 1135, 20 ] , "outputIndexes": [ 1163 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_157_output_0", "inputIndexes": [ 1162, 1163, 77, 31 ] , "outputIndexes": [ 1164 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_110_output_0", "inputIndexes": [ 1161, 1164 ] , "outputIndexes": [ 1165 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_98_output_0", "inputIndexes": [ 1165, 58 ] , "outputIndexes": [ 1166 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_171_output_0", "inputIndexes": [ 1165 ] , "outputIndexes": [ 1167 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4598", "inputIndexes": [ 1167 ] , "outputIndexes": [ 1168 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4600", "inputIndexes": [ 1167 ] , "outputIndexes": [ 1169 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4602", "inputIndexes": [ 1169, 1169 ] , "outputIndexes": [ 1170 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4603", "inputIndexes": [ 1170 ] , "outputIndexes": [ 1171 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4605", "inputIndexes": [ 1170, 12 ] , "outputIndexes": [ 1172 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4606", "inputIndexes": [ 1172 ] , "outputIndexes": [ 1173 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4609", "inputIndexes": [ 1168, 1171, 1173, 15 ] , "outputIndexes": [ 1174 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4610", "inputIndexes": [ 1174 ] , "outputIndexes": [ 1175 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4611", "inputIndexes": [ 61, 1175 ] , "outputIndexes": [ 1176 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4612", "inputIndexes": [ 1176, 1175 ] , "outputIndexes": [ 1177 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_186_output_0", "inputIndexes": [ 1167, 1177, 1170 ] , "outputIndexes": [ 1178 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_37_output_0", "inputIndexes": [ 1178, 73 ] , "outputIndexes": [ 1179 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_393_output_0", "inputIndexes": [ 1179, 20 ] , "outputIndexes": [ 1180 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_51_output_0", "inputIndexes": [ 1165, 1180, 76, 77, 15 ] , "outputIndexes": [ 1181 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_25_output_0", "inputIndexes": [ 1181 ] , "outputIndexes": [ 1182 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_392_output_0", "inputIndexes": [ 1179, 20 ] , "outputIndexes": [ 1183 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_50_output_0", "inputIndexes": [ 1165, 20, 1183, 77, 15 ] , "outputIndexes": [ 1184 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_160_output_0", "inputIndexes": [ 1182, 1184 ] , "outputIndexes": [ 1185 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_99_output_0", "inputIndexes": [ 1185, 89 ] , "outputIndexes": [ 1186 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_61_output_0", "inputIndexes": [ 1166, 1186 ] , "outputIndexes": [ 1187 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/self_attn/v_proj/Linear", "inputIndexes": [ 3057 ] , "outputIndexes": [ 3066 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47747588, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3066 ] , "outputIndexes": [ 3067 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3067 ] , "outputIndexes": [ 1188 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_388_output_0", "inputIndexes": [ 1127, 20 ] , "outputIndexes": [ 1189 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_389_output_0", "inputIndexes": [ 1135, 20 ] , "outputIndexes": [ 1190 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_158_output_0", "inputIndexes": [ 1189, 1190, 77, 31 ] , "outputIndexes": [ 1191 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_111_output_0", "inputIndexes": [ 1188, 1191 ] , "outputIndexes": [ 1192 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_116_output_0", "inputIndexes": [ 1160, 1187, 1192, 124 ] , "outputIndexes": [ 1193 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1193 ] , "outputIndexes": [ 3068 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3068 ] , "outputIndexes": [ 3069 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/self_attn/o_proj/Linear", "inputIndexes": [ 3069 ] , "outputIndexes": [ 3070 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47872266, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3070 ] , "outputIndexes": [ 3071 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3071 ] , "outputIndexes": [ 1194 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_63_output_0", "inputIndexes": [ 1114, 1194 ] , "outputIndexes": [ 1195 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_12/Mul_1_output_0", "inputIndexes": [ 1195 ] , "outputIndexes": [ 1196 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 48245776, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1196 ] , "outputIndexes": [ 3072 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3072 ] , "outputIndexes": [ 3073 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/mlp/gate_proj/Linear", "inputIndexes": [ 3073 ] , "outputIndexes": [ 3074 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 48250384, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3074 ] , "outputIndexes": [ 3075 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3075 ] , "outputIndexes": [ 1197 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_12/Mul_output_0", "inputIndexes": [ 1197 ] , "outputIndexes": [ 1198 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/mlp/up_proj/Linear", "inputIndexes": [ 3073 ] , "outputIndexes": [ 3078 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 49245974, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3078 ] , "outputIndexes": [ 3079 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3079 ] , "outputIndexes": [ 1199 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_12/Mul_output_0", "inputIndexes": [ 1198, 1199 ] , "outputIndexes": [ 1200 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1200 ] , "outputIndexes": [ 3080 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3080 ] , "outputIndexes": [ 3081 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.12/mlp/down_proj/Linear", "inputIndexes": [ 3081 ] , "outputIndexes": [ 3082 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 50241564, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.12/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3082 ] , "outputIndexes": [ 3083 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3083 ] , "outputIndexes": [ 1201 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_64_output_0", "inputIndexes": [ 1195, 1201 ] , "outputIndexes": [ 1202 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_117_output_0", "inputIndexes": [ 1202, 3 ] , "outputIndexes": [ 1203 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_13/Mul_1_output_0", "inputIndexes": [ 1203 ] , "outputIndexes": [ 1204 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 51181858, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1204 ] , "outputIndexes": [ 3084 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3084 ] , "outputIndexes": [ 3085 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/self_attn/q_proj/Linear", "inputIndexes": [ 3085 ] , "outputIndexes": [ 3086 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 51186466, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3086 ] , "outputIndexes": [ 3087 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3087 ] , "outputIndexes": [ 1205 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_182_output_0", "inputIndexes": [ 1204 ] , "outputIndexes": [ 1206 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4931", "inputIndexes": [ 1206 ] , "outputIndexes": [ 1207 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4933", "inputIndexes": [ 1206 ] , "outputIndexes": [ 1208 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4935", "inputIndexes": [ 1208, 1208 ] , "outputIndexes": [ 1209 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4936", "inputIndexes": [ 1209 ] , "outputIndexes": [ 1210 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4938", "inputIndexes": [ 1209, 12 ] , "outputIndexes": [ 1211 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4939", "inputIndexes": [ 1211 ] , "outputIndexes": [ 1212 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4942", "inputIndexes": [ 1207, 1210, 1212, 15 ] , "outputIndexes": [ 1213 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4943", "inputIndexes": [ 1213 ] , "outputIndexes": [ 1214 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4945", "inputIndexes": [ 1214, 1214 ] , "outputIndexes": [ 1215 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_198_output_0", "inputIndexes": [ 1206, 1215, 1209 ] , "outputIndexes": [ 1216 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_416_output_0", "inputIndexes": [ 1216, 20 ] , "outputIndexes": [ 1217 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4953", "inputIndexes": [ 1209 ] , "outputIndexes": [ 1218 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4956", "inputIndexes": [ 1211 ] , "outputIndexes": [ 1219 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4959", "inputIndexes": [ 1207, 1218, 1219, 15 ] , "outputIndexes": [ 1220 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4960", "inputIndexes": [ 1220 ] , "outputIndexes": [ 1221 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4961", "inputIndexes": [ 12, 1221 ] , "outputIndexes": [ 1222 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4962", "inputIndexes": [ 1222, 1221 ] , "outputIndexes": [ 1223 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_199_output_0", "inputIndexes": [ 1206, 1223, 1209 ] , "outputIndexes": [ 1224 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_417_output_0", "inputIndexes": [ 1224, 20 ] , "outputIndexes": [ 1225 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_169_output_0", "inputIndexes": [ 1217, 1225, 30, 31 ] , "outputIndexes": [ 1226 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_118_output_0", "inputIndexes": [ 1205, 1226 ] , "outputIndexes": [ 1227 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_104_output_0", "inputIndexes": [ 1227, 58 ] , "outputIndexes": [ 1228 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_184_output_0", "inputIndexes": [ 1227 ] , "outputIndexes": [ 1229 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5063", "inputIndexes": [ 1229 ] , "outputIndexes": [ 1230 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5065", "inputIndexes": [ 1229 ] , "outputIndexes": [ 1231 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5067", "inputIndexes": [ 1231, 1231 ] , "outputIndexes": [ 1232 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5068", "inputIndexes": [ 1232 ] , "outputIndexes": [ 1233 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5070", "inputIndexes": [ 1232, 12 ] , "outputIndexes": [ 1234 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5071", "inputIndexes": [ 1234 ] , "outputIndexes": [ 1235 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5074", "inputIndexes": [ 1230, 1233, 1235, 15 ] , "outputIndexes": [ 1236 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5075", "inputIndexes": [ 1236 ] , "outputIndexes": [ 1237 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5076", "inputIndexes": [ 61, 1237 ] , "outputIndexes": [ 1238 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5077", "inputIndexes": [ 1238, 1237 ] , "outputIndexes": [ 1239 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_200_output_0", "inputIndexes": [ 1229, 1239, 1232 ] , "outputIndexes": [ 1240 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_39_output_0", "inputIndexes": [ 1240, 73 ] , "outputIndexes": [ 1241 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_423_output_0", "inputIndexes": [ 1241, 20 ] , "outputIndexes": [ 1242 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_53_output_0", "inputIndexes": [ 1227, 1242, 76, 77, 15 ] , "outputIndexes": [ 1243 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_26_output_0", "inputIndexes": [ 1243 ] , "outputIndexes": [ 1244 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_422_output_0", "inputIndexes": [ 1241, 20 ] , "outputIndexes": [ 1245 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_52_output_0", "inputIndexes": [ 1227, 20, 1245, 77, 15 ] , "outputIndexes": [ 1246 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_172_output_0", "inputIndexes": [ 1244, 1246 ] , "outputIndexes": [ 1247 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_105_output_0", "inputIndexes": [ 1247, 89 ] , "outputIndexes": [ 1248 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_65_output_0", "inputIndexes": [ 1228, 1248 ] , "outputIndexes": [ 1249 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/self_attn/k_proj/Linear", "inputIndexes": [ 3085 ] , "outputIndexes": [ 3090 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 51559976, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3090 ] , "outputIndexes": [ 3091 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3091 ] , "outputIndexes": [ 1250 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_418_output_0", "inputIndexes": [ 1216, 20 ] , "outputIndexes": [ 1251 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_419_output_0", "inputIndexes": [ 1224, 20 ] , "outputIndexes": [ 1252 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_170_output_0", "inputIndexes": [ 1251, 1252, 77, 31 ] , "outputIndexes": [ 1253 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_119_output_0", "inputIndexes": [ 1250, 1253 ] , "outputIndexes": [ 1254 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_106_output_0", "inputIndexes": [ 1254, 58 ] , "outputIndexes": [ 1255 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_185_output_0", "inputIndexes": [ 1254 ] , "outputIndexes": [ 1256 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape4969", "inputIndexes": [ 1256 ] , "outputIndexes": [ 1257 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank4971", "inputIndexes": [ 1256 ] , "outputIndexes": [ 1258 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4973", "inputIndexes": [ 1258, 1258 ] , "outputIndexes": [ 1259 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4974", "inputIndexes": [ 1259 ] , "outputIndexes": [ 1260 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4976", "inputIndexes": [ 1259, 12 ] , "outputIndexes": [ 1261 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze4977", "inputIndexes": [ 1261 ] , "outputIndexes": [ 1262 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice4980", "inputIndexes": [ 1257, 1260, 1262, 15 ] , "outputIndexes": [ 1263 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze4981", "inputIndexes": [ 1263 ] , "outputIndexes": [ 1264 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4982", "inputIndexes": [ 61, 1264 ] , "outputIndexes": [ 1265 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp4983", "inputIndexes": [ 1265, 1264 ] , "outputIndexes": [ 1266 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_201_output_0", "inputIndexes": [ 1256, 1266, 1259 ] , "outputIndexes": [ 1267 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_40_output_0", "inputIndexes": [ 1267, 73 ] , "outputIndexes": [ 1268 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_425_output_0", "inputIndexes": [ 1268, 20 ] , "outputIndexes": [ 1269 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_55_output_0", "inputIndexes": [ 1254, 1269, 76, 77, 15 ] , "outputIndexes": [ 1270 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_27_output_0", "inputIndexes": [ 1270 ] , "outputIndexes": [ 1271 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_424_output_0", "inputIndexes": [ 1268, 20 ] , "outputIndexes": [ 1272 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_54_output_0", "inputIndexes": [ 1254, 20, 1272, 77, 15 ] , "outputIndexes": [ 1273 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_173_output_0", "inputIndexes": [ 1271, 1273 ] , "outputIndexes": [ 1274 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_107_output_0", "inputIndexes": [ 1274, 89 ] , "outputIndexes": [ 1275 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_66_output_0", "inputIndexes": [ 1255, 1275 ] , "outputIndexes": [ 1276 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/self_attn/v_proj/Linear", "inputIndexes": [ 3085 ] , "outputIndexes": [ 3094 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 51684654, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3094 ] , "outputIndexes": [ 3095 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3095 ] , "outputIndexes": [ 1277 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_420_output_0", "inputIndexes": [ 1216, 20 ] , "outputIndexes": [ 1278 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_421_output_0", "inputIndexes": [ 1224, 20 ] , "outputIndexes": [ 1279 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_171_output_0", "inputIndexes": [ 1278, 1279, 77, 31 ] , "outputIndexes": [ 1280 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_120_output_0", "inputIndexes": [ 1277, 1280 ] , "outputIndexes": [ 1281 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_125_output_0", "inputIndexes": [ 1249, 1276, 1281, 124 ] , "outputIndexes": [ 1282 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1282 ] , "outputIndexes": [ 3096 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3096 ] , "outputIndexes": [ 3097 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/self_attn/o_proj/Linear", "inputIndexes": [ 3097 ] , "outputIndexes": [ 3098 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 51809332, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3098 ] , "outputIndexes": [ 3099 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3099 ] , "outputIndexes": [ 1283 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_68_output_0", "inputIndexes": [ 1203, 1283 ] , "outputIndexes": [ 1284 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_13/Mul_1_output_0", "inputIndexes": [ 1284 ] , "outputIndexes": [ 1285 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 52182842, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1285 ] , "outputIndexes": [ 3100 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3100 ] , "outputIndexes": [ 3101 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/mlp/gate_proj/Linear", "inputIndexes": [ 3101 ] , "outputIndexes": [ 3102 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 52187450, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3102 ] , "outputIndexes": [ 3103 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3103 ] , "outputIndexes": [ 1286 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_13/Mul_output_0", "inputIndexes": [ 1286 ] , "outputIndexes": [ 1287 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/mlp/up_proj/Linear", "inputIndexes": [ 3101 ] , "outputIndexes": [ 3106 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 53183040, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3106 ] , "outputIndexes": [ 3107 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3107 ] , "outputIndexes": [ 1288 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_13/Mul_output_0", "inputIndexes": [ 1287, 1288 ] , "outputIndexes": [ 1289 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1289 ] , "outputIndexes": [ 3108 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3108 ] , "outputIndexes": [ 3109 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.13/mlp/down_proj/Linear", "inputIndexes": [ 3109 ] , "outputIndexes": [ 3110 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 54178630, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.13/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3110 ] , "outputIndexes": [ 3111 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3111 ] , "outputIndexes": [ 1290 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_69_output_0", "inputIndexes": [ 1284, 1290 ] , "outputIndexes": [ 1291 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_126_output_0", "inputIndexes": [ 1291, 3 ] , "outputIndexes": [ 1292 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_14/Mul_1_output_0", "inputIndexes": [ 1292 ] , "outputIndexes": [ 1293 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 55118924, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1293 ] , "outputIndexes": [ 3112 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3112 ] , "outputIndexes": [ 3113 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/self_attn/q_proj/Linear", "inputIndexes": [ 3113 ] , "outputIndexes": [ 3114 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 55123532, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3114 ] , "outputIndexes": [ 3115 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3115 ] , "outputIndexes": [ 1294 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_196_output_0", "inputIndexes": [ 1293 ] , "outputIndexes": [ 1295 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5302", "inputIndexes": [ 1295 ] , "outputIndexes": [ 1296 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5304", "inputIndexes": [ 1295 ] , "outputIndexes": [ 1297 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5306", "inputIndexes": [ 1297, 1297 ] , "outputIndexes": [ 1298 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5307", "inputIndexes": [ 1298 ] , "outputIndexes": [ 1299 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5309", "inputIndexes": [ 1298, 12 ] , "outputIndexes": [ 1300 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5310", "inputIndexes": [ 1300 ] , "outputIndexes": [ 1301 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5313", "inputIndexes": [ 1296, 1299, 1301, 15 ] , "outputIndexes": [ 1302 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5314", "inputIndexes": [ 1302 ] , "outputIndexes": [ 1303 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5316", "inputIndexes": [ 1303, 1303 ] , "outputIndexes": [ 1304 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_213_output_0", "inputIndexes": [ 1295, 1304, 1298 ] , "outputIndexes": [ 1305 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_448_output_0", "inputIndexes": [ 1305, 20 ] , "outputIndexes": [ 1306 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5324", "inputIndexes": [ 1298 ] , "outputIndexes": [ 1307 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5327", "inputIndexes": [ 1300 ] , "outputIndexes": [ 1308 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5330", "inputIndexes": [ 1296, 1307, 1308, 15 ] , "outputIndexes": [ 1309 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5331", "inputIndexes": [ 1309 ] , "outputIndexes": [ 1310 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5332", "inputIndexes": [ 12, 1310 ] , "outputIndexes": [ 1311 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5333", "inputIndexes": [ 1311, 1310 ] , "outputIndexes": [ 1312 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_214_output_0", "inputIndexes": [ 1295, 1312, 1298 ] , "outputIndexes": [ 1313 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_449_output_0", "inputIndexes": [ 1313, 20 ] , "outputIndexes": [ 1314 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_182_output_0", "inputIndexes": [ 1306, 1314, 30, 31 ] , "outputIndexes": [ 1315 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_127_output_0", "inputIndexes": [ 1294, 1315 ] , "outputIndexes": [ 1316 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_112_output_0", "inputIndexes": [ 1316, 58 ] , "outputIndexes": [ 1317 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_198_output_0", "inputIndexes": [ 1316 ] , "outputIndexes": [ 1318 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5434", "inputIndexes": [ 1318 ] , "outputIndexes": [ 1319 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5436", "inputIndexes": [ 1318 ] , "outputIndexes": [ 1320 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5438", "inputIndexes": [ 1320, 1320 ] , "outputIndexes": [ 1321 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5439", "inputIndexes": [ 1321 ] , "outputIndexes": [ 1322 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5441", "inputIndexes": [ 1321, 12 ] , "outputIndexes": [ 1323 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5442", "inputIndexes": [ 1323 ] , "outputIndexes": [ 1324 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5445", "inputIndexes": [ 1319, 1322, 1324, 15 ] , "outputIndexes": [ 1325 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5446", "inputIndexes": [ 1325 ] , "outputIndexes": [ 1326 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5447", "inputIndexes": [ 61, 1326 ] , "outputIndexes": [ 1327 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5448", "inputIndexes": [ 1327, 1326 ] , "outputIndexes": [ 1328 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_215_output_0", "inputIndexes": [ 1318, 1328, 1321 ] , "outputIndexes": [ 1329 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_42_output_0", "inputIndexes": [ 1329, 73 ] , "outputIndexes": [ 1330 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_455_output_0", "inputIndexes": [ 1330, 20 ] , "outputIndexes": [ 1331 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_57_output_0", "inputIndexes": [ 1316, 1331, 76, 77, 15 ] , "outputIndexes": [ 1332 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_28_output_0", "inputIndexes": [ 1332 ] , "outputIndexes": [ 1333 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_454_output_0", "inputIndexes": [ 1330, 20 ] , "outputIndexes": [ 1334 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_56_output_0", "inputIndexes": [ 1316, 20, 1334, 77, 15 ] , "outputIndexes": [ 1335 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_185_output_0", "inputIndexes": [ 1333, 1335 ] , "outputIndexes": [ 1336 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_113_output_0", "inputIndexes": [ 1336, 89 ] , "outputIndexes": [ 1337 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_70_output_0", "inputIndexes": [ 1317, 1337 ] , "outputIndexes": [ 1338 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/self_attn/k_proj/Linear", "inputIndexes": [ 3113 ] , "outputIndexes": [ 3118 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 55497042, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3118 ] , "outputIndexes": [ 3119 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3119 ] , "outputIndexes": [ 1339 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_450_output_0", "inputIndexes": [ 1305, 20 ] , "outputIndexes": [ 1340 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_451_output_0", "inputIndexes": [ 1313, 20 ] , "outputIndexes": [ 1341 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_183_output_0", "inputIndexes": [ 1340, 1341, 77, 31 ] , "outputIndexes": [ 1342 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_128_output_0", "inputIndexes": [ 1339, 1342 ] , "outputIndexes": [ 1343 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_114_output_0", "inputIndexes": [ 1343, 58 ] , "outputIndexes": [ 1344 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_199_output_0", "inputIndexes": [ 1343 ] , "outputIndexes": [ 1345 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5340", "inputIndexes": [ 1345 ] , "outputIndexes": [ 1346 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5342", "inputIndexes": [ 1345 ] , "outputIndexes": [ 1347 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5344", "inputIndexes": [ 1347, 1347 ] , "outputIndexes": [ 1348 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5345", "inputIndexes": [ 1348 ] , "outputIndexes": [ 1349 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5347", "inputIndexes": [ 1348, 12 ] , "outputIndexes": [ 1350 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5348", "inputIndexes": [ 1350 ] , "outputIndexes": [ 1351 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5351", "inputIndexes": [ 1346, 1349, 1351, 15 ] , "outputIndexes": [ 1352 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5352", "inputIndexes": [ 1352 ] , "outputIndexes": [ 1353 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5353", "inputIndexes": [ 61, 1353 ] , "outputIndexes": [ 1354 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5354", "inputIndexes": [ 1354, 1353 ] , "outputIndexes": [ 1355 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_216_output_0", "inputIndexes": [ 1345, 1355, 1348 ] , "outputIndexes": [ 1356 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_43_output_0", "inputIndexes": [ 1356, 73 ] , "outputIndexes": [ 1357 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_457_output_0", "inputIndexes": [ 1357, 20 ] , "outputIndexes": [ 1358 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_59_output_0", "inputIndexes": [ 1343, 1358, 76, 77, 15 ] , "outputIndexes": [ 1359 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_29_output_0", "inputIndexes": [ 1359 ] , "outputIndexes": [ 1360 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_456_output_0", "inputIndexes": [ 1357, 20 ] , "outputIndexes": [ 1361 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_58_output_0", "inputIndexes": [ 1343, 20, 1361, 77, 15 ] , "outputIndexes": [ 1362 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_186_output_0", "inputIndexes": [ 1360, 1362 ] , "outputIndexes": [ 1363 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_115_output_0", "inputIndexes": [ 1363, 89 ] , "outputIndexes": [ 1364 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_71_output_0", "inputIndexes": [ 1344, 1364 ] , "outputIndexes": [ 1365 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/self_attn/v_proj/Linear", "inputIndexes": [ 3113 ] , "outputIndexes": [ 3122 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 55621720, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3122 ] , "outputIndexes": [ 3123 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3123 ] , "outputIndexes": [ 1366 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_452_output_0", "inputIndexes": [ 1305, 20 ] , "outputIndexes": [ 1367 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_453_output_0", "inputIndexes": [ 1313, 20 ] , "outputIndexes": [ 1368 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_184_output_0", "inputIndexes": [ 1367, 1368, 77, 31 ] , "outputIndexes": [ 1369 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_129_output_0", "inputIndexes": [ 1366, 1369 ] , "outputIndexes": [ 1370 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_134_output_0", "inputIndexes": [ 1338, 1365, 1370, 124 ] , "outputIndexes": [ 1371 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1371 ] , "outputIndexes": [ 3124 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3124 ] , "outputIndexes": [ 3125 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/self_attn/o_proj/Linear", "inputIndexes": [ 3125 ] , "outputIndexes": [ 3126 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 55746398, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3126 ] , "outputIndexes": [ 3127 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3127 ] , "outputIndexes": [ 1372 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_73_output_0", "inputIndexes": [ 1292, 1372 ] , "outputIndexes": [ 1373 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_14/Mul_1_output_0", "inputIndexes": [ 1373 ] , "outputIndexes": [ 1374 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 56119908, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1374 ] , "outputIndexes": [ 3128 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3128 ] , "outputIndexes": [ 3129 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/mlp/gate_proj/Linear", "inputIndexes": [ 3129 ] , "outputIndexes": [ 3130 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56124516, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3130 ] , "outputIndexes": [ 3131 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3131 ] , "outputIndexes": [ 1375 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_14/Mul_output_0", "inputIndexes": [ 1375 ] , "outputIndexes": [ 1376 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/mlp/up_proj/Linear", "inputIndexes": [ 3129 ] , "outputIndexes": [ 3134 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 57120106, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3134 ] , "outputIndexes": [ 3135 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3135 ] , "outputIndexes": [ 1377 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_14/Mul_output_0", "inputIndexes": [ 1376, 1377 ] , "outputIndexes": [ 1378 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1378 ] , "outputIndexes": [ 3136 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3136 ] , "outputIndexes": [ 3137 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.14/mlp/down_proj/Linear", "inputIndexes": [ 3137 ] , "outputIndexes": [ 3138 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 58115696, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.14/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3138 ] , "outputIndexes": [ 3139 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3139 ] , "outputIndexes": [ 1379 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_74_output_0", "inputIndexes": [ 1373, 1379 ] , "outputIndexes": [ 1380 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_135_output_0", "inputIndexes": [ 1380, 3 ] , "outputIndexes": [ 1381 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_15/Mul_1_output_0", "inputIndexes": [ 1381 ] , "outputIndexes": [ 1382 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 59055990, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1382 ] , "outputIndexes": [ 3140 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3140 ] , "outputIndexes": [ 3141 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/self_attn/q_proj/Linear", "inputIndexes": [ 3141 ] , "outputIndexes": [ 3142 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 59060598, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3142 ] , "outputIndexes": [ 3143 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3143 ] , "outputIndexes": [ 1383 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_210_output_0", "inputIndexes": [ 1382 ] , "outputIndexes": [ 1384 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5673", "inputIndexes": [ 1384 ] , "outputIndexes": [ 1385 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5675", "inputIndexes": [ 1384 ] , "outputIndexes": [ 1386 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5677", "inputIndexes": [ 1386, 1386 ] , "outputIndexes": [ 1387 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5678", "inputIndexes": [ 1387 ] , "outputIndexes": [ 1388 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5680", "inputIndexes": [ 1387, 12 ] , "outputIndexes": [ 1389 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5681", "inputIndexes": [ 1389 ] , "outputIndexes": [ 1390 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5684", "inputIndexes": [ 1385, 1388, 1390, 15 ] , "outputIndexes": [ 1391 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5685", "inputIndexes": [ 1391 ] , "outputIndexes": [ 1392 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5687", "inputIndexes": [ 1392, 1392 ] , "outputIndexes": [ 1393 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_228_output_0", "inputIndexes": [ 1384, 1393, 1387 ] , "outputIndexes": [ 1394 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_480_output_0", "inputIndexes": [ 1394, 20 ] , "outputIndexes": [ 1395 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5695", "inputIndexes": [ 1387 ] , "outputIndexes": [ 1396 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5698", "inputIndexes": [ 1389 ] , "outputIndexes": [ 1397 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5701", "inputIndexes": [ 1385, 1396, 1397, 15 ] , "outputIndexes": [ 1398 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5702", "inputIndexes": [ 1398 ] , "outputIndexes": [ 1399 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5703", "inputIndexes": [ 12, 1399 ] , "outputIndexes": [ 1400 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5704", "inputIndexes": [ 1400, 1399 ] , "outputIndexes": [ 1401 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_229_output_0", "inputIndexes": [ 1384, 1401, 1387 ] , "outputIndexes": [ 1402 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_481_output_0", "inputIndexes": [ 1402, 20 ] , "outputIndexes": [ 1403 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_195_output_0", "inputIndexes": [ 1395, 1403, 30, 31 ] , "outputIndexes": [ 1404 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_136_output_0", "inputIndexes": [ 1383, 1404 ] , "outputIndexes": [ 1405 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_120_output_0", "inputIndexes": [ 1405, 58 ] , "outputIndexes": [ 1406 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_212_output_0", "inputIndexes": [ 1405 ] , "outputIndexes": [ 1407 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5805", "inputIndexes": [ 1407 ] , "outputIndexes": [ 1408 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5807", "inputIndexes": [ 1407 ] , "outputIndexes": [ 1409 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5809", "inputIndexes": [ 1409, 1409 ] , "outputIndexes": [ 1410 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5810", "inputIndexes": [ 1410 ] , "outputIndexes": [ 1411 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5812", "inputIndexes": [ 1410, 12 ] , "outputIndexes": [ 1412 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5813", "inputIndexes": [ 1412 ] , "outputIndexes": [ 1413 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5816", "inputIndexes": [ 1408, 1411, 1413, 15 ] , "outputIndexes": [ 1414 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5817", "inputIndexes": [ 1414 ] , "outputIndexes": [ 1415 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5818", "inputIndexes": [ 61, 1415 ] , "outputIndexes": [ 1416 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5819", "inputIndexes": [ 1416, 1415 ] , "outputIndexes": [ 1417 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_230_output_0", "inputIndexes": [ 1407, 1417, 1410 ] , "outputIndexes": [ 1418 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_45_output_0", "inputIndexes": [ 1418, 73 ] , "outputIndexes": [ 1419 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_487_output_0", "inputIndexes": [ 1419, 20 ] , "outputIndexes": [ 1420 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_61_output_0", "inputIndexes": [ 1405, 1420, 76, 77, 15 ] , "outputIndexes": [ 1421 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_30_output_0", "inputIndexes": [ 1421 ] , "outputIndexes": [ 1422 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_486_output_0", "inputIndexes": [ 1419, 20 ] , "outputIndexes": [ 1423 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_60_output_0", "inputIndexes": [ 1405, 20, 1423, 77, 15 ] , "outputIndexes": [ 1424 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_198_output_0", "inputIndexes": [ 1422, 1424 ] , "outputIndexes": [ 1425 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_121_output_0", "inputIndexes": [ 1425, 89 ] , "outputIndexes": [ 1426 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_75_output_0", "inputIndexes": [ 1406, 1426 ] , "outputIndexes": [ 1427 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/self_attn/k_proj/Linear", "inputIndexes": [ 3141 ] , "outputIndexes": [ 3146 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 59434108, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3146 ] , "outputIndexes": [ 3147 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3147 ] , "outputIndexes": [ 1428 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_482_output_0", "inputIndexes": [ 1394, 20 ] , "outputIndexes": [ 1429 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_483_output_0", "inputIndexes": [ 1402, 20 ] , "outputIndexes": [ 1430 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_196_output_0", "inputIndexes": [ 1429, 1430, 77, 31 ] , "outputIndexes": [ 1431 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_137_output_0", "inputIndexes": [ 1428, 1431 ] , "outputIndexes": [ 1432 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_122_output_0", "inputIndexes": [ 1432, 58 ] , "outputIndexes": [ 1433 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_213_output_0", "inputIndexes": [ 1432 ] , "outputIndexes": [ 1434 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape5711", "inputIndexes": [ 1434 ] , "outputIndexes": [ 1435 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank5713", "inputIndexes": [ 1434 ] , "outputIndexes": [ 1436 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5715", "inputIndexes": [ 1436, 1436 ] , "outputIndexes": [ 1437 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5716", "inputIndexes": [ 1437 ] , "outputIndexes": [ 1438 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5718", "inputIndexes": [ 1437, 12 ] , "outputIndexes": [ 1439 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze5719", "inputIndexes": [ 1439 ] , "outputIndexes": [ 1440 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice5722", "inputIndexes": [ 1435, 1438, 1440, 15 ] , "outputIndexes": [ 1441 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze5723", "inputIndexes": [ 1441 ] , "outputIndexes": [ 1442 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5724", "inputIndexes": [ 61, 1442 ] , "outputIndexes": [ 1443 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp5725", "inputIndexes": [ 1443, 1442 ] , "outputIndexes": [ 1444 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_231_output_0", "inputIndexes": [ 1434, 1444, 1437 ] , "outputIndexes": [ 1445 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_46_output_0", "inputIndexes": [ 1445, 73 ] , "outputIndexes": [ 1446 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_489_output_0", "inputIndexes": [ 1446, 20 ] , "outputIndexes": [ 1447 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_63_output_0", "inputIndexes": [ 1432, 1447, 76, 77, 15 ] , "outputIndexes": [ 1448 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_31_output_0", "inputIndexes": [ 1448 ] , "outputIndexes": [ 1449 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_488_output_0", "inputIndexes": [ 1446, 20 ] , "outputIndexes": [ 1450 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_62_output_0", "inputIndexes": [ 1432, 20, 1450, 77, 15 ] , "outputIndexes": [ 1451 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_199_output_0", "inputIndexes": [ 1449, 1451 ] , "outputIndexes": [ 1452 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_123_output_0", "inputIndexes": [ 1452, 89 ] , "outputIndexes": [ 1453 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_76_output_0", "inputIndexes": [ 1433, 1453 ] , "outputIndexes": [ 1454 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/self_attn/v_proj/Linear", "inputIndexes": [ 3141 ] , "outputIndexes": [ 3150 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 59558786, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3150 ] , "outputIndexes": [ 3151 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3151 ] , "outputIndexes": [ 1455 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_484_output_0", "inputIndexes": [ 1394, 20 ] , "outputIndexes": [ 1456 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_485_output_0", "inputIndexes": [ 1402, 20 ] , "outputIndexes": [ 1457 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_197_output_0", "inputIndexes": [ 1456, 1457, 77, 31 ] , "outputIndexes": [ 1458 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_138_output_0", "inputIndexes": [ 1455, 1458 ] , "outputIndexes": [ 1459 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_143_output_0", "inputIndexes": [ 1427, 1454, 1459, 124 ] , "outputIndexes": [ 1460 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1460 ] , "outputIndexes": [ 3152 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3152 ] , "outputIndexes": [ 3153 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/self_attn/o_proj/Linear", "inputIndexes": [ 3153 ] , "outputIndexes": [ 3154 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 59683464, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3154 ] , "outputIndexes": [ 3155 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3155 ] , "outputIndexes": [ 1461 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_78_output_0", "inputIndexes": [ 1381, 1461 ] , "outputIndexes": [ 1462 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_15/Mul_1_output_0", "inputIndexes": [ 1462 ] , "outputIndexes": [ 1463 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 60056974, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1463 ] , "outputIndexes": [ 3156 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3156 ] , "outputIndexes": [ 3157 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/mlp/gate_proj/Linear", "inputIndexes": [ 3157 ] , "outputIndexes": [ 3158 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 60061582, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3158 ] , "outputIndexes": [ 3159 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3159 ] , "outputIndexes": [ 1464 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_15/Mul_output_0", "inputIndexes": [ 1464 ] , "outputIndexes": [ 1465 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/mlp/up_proj/Linear", "inputIndexes": [ 3157 ] , "outputIndexes": [ 3162 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 61057172, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3162 ] , "outputIndexes": [ 3163 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3163 ] , "outputIndexes": [ 1466 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_15/Mul_output_0", "inputIndexes": [ 1465, 1466 ] , "outputIndexes": [ 1467 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1467 ] , "outputIndexes": [ 3164 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3164 ] , "outputIndexes": [ 3165 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.15/mlp/down_proj/Linear", "inputIndexes": [ 3165 ] , "outputIndexes": [ 3166 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 62052762, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.15/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3166 ] , "outputIndexes": [ 3167 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3167 ] , "outputIndexes": [ 1468 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_79_output_0", "inputIndexes": [ 1462, 1468 ] , "outputIndexes": [ 1469 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_144_output_0", "inputIndexes": [ 1469, 3 ] , "outputIndexes": [ 1470 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_16/Mul_1_output_0", "inputIndexes": [ 1470 ] , "outputIndexes": [ 1471 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 62993056, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1471 ] , "outputIndexes": [ 3168 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3168 ] , "outputIndexes": [ 3169 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/self_attn/q_proj/Linear", "inputIndexes": [ 3169 ] , "outputIndexes": [ 3170 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 62997664, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3170 ] , "outputIndexes": [ 3171 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3171 ] , "outputIndexes": [ 1472 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_224_output_0", "inputIndexes": [ 1471 ] , "outputIndexes": [ 1473 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6044", "inputIndexes": [ 1473 ] , "outputIndexes": [ 1474 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6046", "inputIndexes": [ 1473 ] , "outputIndexes": [ 1475 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6048", "inputIndexes": [ 1475, 1475 ] , "outputIndexes": [ 1476 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6049", "inputIndexes": [ 1476 ] , "outputIndexes": [ 1477 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6051", "inputIndexes": [ 1476, 12 ] , "outputIndexes": [ 1478 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6052", "inputIndexes": [ 1478 ] , "outputIndexes": [ 1479 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6055", "inputIndexes": [ 1474, 1477, 1479, 15 ] , "outputIndexes": [ 1480 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6056", "inputIndexes": [ 1480 ] , "outputIndexes": [ 1481 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6058", "inputIndexes": [ 1481, 1481 ] , "outputIndexes": [ 1482 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_243_output_0", "inputIndexes": [ 1473, 1482, 1476 ] , "outputIndexes": [ 1483 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_512_output_0", "inputIndexes": [ 1483, 20 ] , "outputIndexes": [ 1484 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6066", "inputIndexes": [ 1476 ] , "outputIndexes": [ 1485 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6069", "inputIndexes": [ 1478 ] , "outputIndexes": [ 1486 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6072", "inputIndexes": [ 1474, 1485, 1486, 15 ] , "outputIndexes": [ 1487 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6073", "inputIndexes": [ 1487 ] , "outputIndexes": [ 1488 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6074", "inputIndexes": [ 12, 1488 ] , "outputIndexes": [ 1489 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6075", "inputIndexes": [ 1489, 1488 ] , "outputIndexes": [ 1490 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_244_output_0", "inputIndexes": [ 1473, 1490, 1476 ] , "outputIndexes": [ 1491 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_513_output_0", "inputIndexes": [ 1491, 20 ] , "outputIndexes": [ 1492 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_208_output_0", "inputIndexes": [ 1484, 1492, 30, 31 ] , "outputIndexes": [ 1493 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_145_output_0", "inputIndexes": [ 1472, 1493 ] , "outputIndexes": [ 1494 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_128_output_0", "inputIndexes": [ 1494, 58 ] , "outputIndexes": [ 1495 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_226_output_0", "inputIndexes": [ 1494 ] , "outputIndexes": [ 1496 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6176", "inputIndexes": [ 1496 ] , "outputIndexes": [ 1497 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6178", "inputIndexes": [ 1496 ] , "outputIndexes": [ 1498 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6180", "inputIndexes": [ 1498, 1498 ] , "outputIndexes": [ 1499 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6181", "inputIndexes": [ 1499 ] , "outputIndexes": [ 1500 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6183", "inputIndexes": [ 1499, 12 ] , "outputIndexes": [ 1501 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6184", "inputIndexes": [ 1501 ] , "outputIndexes": [ 1502 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6187", "inputIndexes": [ 1497, 1500, 1502, 15 ] , "outputIndexes": [ 1503 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6188", "inputIndexes": [ 1503 ] , "outputIndexes": [ 1504 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6189", "inputIndexes": [ 61, 1504 ] , "outputIndexes": [ 1505 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6190", "inputIndexes": [ 1505, 1504 ] , "outputIndexes": [ 1506 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_245_output_0", "inputIndexes": [ 1496, 1506, 1499 ] , "outputIndexes": [ 1507 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_48_output_0", "inputIndexes": [ 1507, 73 ] , "outputIndexes": [ 1508 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_519_output_0", "inputIndexes": [ 1508, 20 ] , "outputIndexes": [ 1509 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_65_output_0", "inputIndexes": [ 1494, 1509, 76, 77, 15 ] , "outputIndexes": [ 1510 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_32_output_0", "inputIndexes": [ 1510 ] , "outputIndexes": [ 1511 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_518_output_0", "inputIndexes": [ 1508, 20 ] , "outputIndexes": [ 1512 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_64_output_0", "inputIndexes": [ 1494, 20, 1512, 77, 15 ] , "outputIndexes": [ 1513 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_211_output_0", "inputIndexes": [ 1511, 1513 ] , "outputIndexes": [ 1514 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_129_output_0", "inputIndexes": [ 1514, 89 ] , "outputIndexes": [ 1515 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_80_output_0", "inputIndexes": [ 1495, 1515 ] , "outputIndexes": [ 1516 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/self_attn/k_proj/Linear", "inputIndexes": [ 3169 ] , "outputIndexes": [ 3174 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63371174, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3174 ] , "outputIndexes": [ 3175 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3175 ] , "outputIndexes": [ 1517 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_514_output_0", "inputIndexes": [ 1483, 20 ] , "outputIndexes": [ 1518 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_515_output_0", "inputIndexes": [ 1491, 20 ] , "outputIndexes": [ 1519 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_209_output_0", "inputIndexes": [ 1518, 1519, 77, 31 ] , "outputIndexes": [ 1520 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_146_output_0", "inputIndexes": [ 1517, 1520 ] , "outputIndexes": [ 1521 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_130_output_0", "inputIndexes": [ 1521, 58 ] , "outputIndexes": [ 1522 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_227_output_0", "inputIndexes": [ 1521 ] , "outputIndexes": [ 1523 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6082", "inputIndexes": [ 1523 ] , "outputIndexes": [ 1524 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6084", "inputIndexes": [ 1523 ] , "outputIndexes": [ 1525 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6086", "inputIndexes": [ 1525, 1525 ] , "outputIndexes": [ 1526 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6087", "inputIndexes": [ 1526 ] , "outputIndexes": [ 1527 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6089", "inputIndexes": [ 1526, 12 ] , "outputIndexes": [ 1528 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6090", "inputIndexes": [ 1528 ] , "outputIndexes": [ 1529 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6093", "inputIndexes": [ 1524, 1527, 1529, 15 ] , "outputIndexes": [ 1530 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6094", "inputIndexes": [ 1530 ] , "outputIndexes": [ 1531 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6095", "inputIndexes": [ 61, 1531 ] , "outputIndexes": [ 1532 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6096", "inputIndexes": [ 1532, 1531 ] , "outputIndexes": [ 1533 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_246_output_0", "inputIndexes": [ 1523, 1533, 1526 ] , "outputIndexes": [ 1534 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_49_output_0", "inputIndexes": [ 1534, 73 ] , "outputIndexes": [ 1535 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_521_output_0", "inputIndexes": [ 1535, 20 ] , "outputIndexes": [ 1536 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_67_output_0", "inputIndexes": [ 1521, 1536, 76, 77, 15 ] , "outputIndexes": [ 1537 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_33_output_0", "inputIndexes": [ 1537 ] , "outputIndexes": [ 1538 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_520_output_0", "inputIndexes": [ 1535, 20 ] , "outputIndexes": [ 1539 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_66_output_0", "inputIndexes": [ 1521, 20, 1539, 77, 15 ] , "outputIndexes": [ 1540 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_212_output_0", "inputIndexes": [ 1538, 1540 ] , "outputIndexes": [ 1541 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_131_output_0", "inputIndexes": [ 1541, 89 ] , "outputIndexes": [ 1542 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_81_output_0", "inputIndexes": [ 1522, 1542 ] , "outputIndexes": [ 1543 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/self_attn/v_proj/Linear", "inputIndexes": [ 3169 ] , "outputIndexes": [ 3178 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63495852, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3178 ] , "outputIndexes": [ 3179 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3179 ] , "outputIndexes": [ 1544 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_516_output_0", "inputIndexes": [ 1483, 20 ] , "outputIndexes": [ 1545 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_517_output_0", "inputIndexes": [ 1491, 20 ] , "outputIndexes": [ 1546 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_210_output_0", "inputIndexes": [ 1545, 1546, 77, 31 ] , "outputIndexes": [ 1547 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_147_output_0", "inputIndexes": [ 1544, 1547 ] , "outputIndexes": [ 1548 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_152_output_0", "inputIndexes": [ 1516, 1543, 1548, 124 ] , "outputIndexes": [ 1549 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1549 ] , "outputIndexes": [ 3180 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3180 ] , "outputIndexes": [ 3181 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/self_attn/o_proj/Linear", "inputIndexes": [ 3181 ] , "outputIndexes": [ 3182 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63620530, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3182 ] , "outputIndexes": [ 3183 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3183 ] , "outputIndexes": [ 1550 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_83_output_0", "inputIndexes": [ 1470, 1550 ] , "outputIndexes": [ 1551 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_16/Mul_1_output_0", "inputIndexes": [ 1551 ] , "outputIndexes": [ 1552 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 63994040, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1552 ] , "outputIndexes": [ 3184 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3184 ] , "outputIndexes": [ 3185 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/mlp/gate_proj/Linear", "inputIndexes": [ 3185 ] , "outputIndexes": [ 3186 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 63998648, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3186 ] , "outputIndexes": [ 3187 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3187 ] , "outputIndexes": [ 1553 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_16/Mul_output_0", "inputIndexes": [ 1553 ] , "outputIndexes": [ 1554 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/mlp/up_proj/Linear", "inputIndexes": [ 3185 ] , "outputIndexes": [ 3190 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 64994238, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3190 ] , "outputIndexes": [ 3191 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3191 ] , "outputIndexes": [ 1555 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_16/Mul_output_0", "inputIndexes": [ 1554, 1555 ] , "outputIndexes": [ 1556 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1556 ] , "outputIndexes": [ 3192 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3192 ] , "outputIndexes": [ 3193 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.16/mlp/down_proj/Linear", "inputIndexes": [ 3193 ] , "outputIndexes": [ 3194 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 65989828, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.16/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3194 ] , "outputIndexes": [ 3195 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3195 ] , "outputIndexes": [ 1557 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_84_output_0", "inputIndexes": [ 1551, 1557 ] , "outputIndexes": [ 1558 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_153_output_0", "inputIndexes": [ 1558, 3 ] , "outputIndexes": [ 1559 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_17/Mul_1_output_0", "inputIndexes": [ 1559 ] , "outputIndexes": [ 1560 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 66930122, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1560 ] , "outputIndexes": [ 3196 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3196 ] , "outputIndexes": [ 3197 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/self_attn/q_proj/Linear", "inputIndexes": [ 3197 ] , "outputIndexes": [ 3198 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 66934730, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3198 ] , "outputIndexes": [ 3199 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3199 ] , "outputIndexes": [ 1561 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_238_output_0", "inputIndexes": [ 1560 ] , "outputIndexes": [ 1562 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6415", "inputIndexes": [ 1562 ] , "outputIndexes": [ 1563 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6417", "inputIndexes": [ 1562 ] , "outputIndexes": [ 1564 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6419", "inputIndexes": [ 1564, 1564 ] , "outputIndexes": [ 1565 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6420", "inputIndexes": [ 1565 ] , "outputIndexes": [ 1566 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6422", "inputIndexes": [ 1565, 12 ] , "outputIndexes": [ 1567 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6423", "inputIndexes": [ 1567 ] , "outputIndexes": [ 1568 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6426", "inputIndexes": [ 1563, 1566, 1568, 15 ] , "outputIndexes": [ 1569 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6427", "inputIndexes": [ 1569 ] , "outputIndexes": [ 1570 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6429", "inputIndexes": [ 1570, 1570 ] , "outputIndexes": [ 1571 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_258_output_0", "inputIndexes": [ 1562, 1571, 1565 ] , "outputIndexes": [ 1572 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_544_output_0", "inputIndexes": [ 1572, 20 ] , "outputIndexes": [ 1573 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6437", "inputIndexes": [ 1565 ] , "outputIndexes": [ 1574 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6440", "inputIndexes": [ 1567 ] , "outputIndexes": [ 1575 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6443", "inputIndexes": [ 1563, 1574, 1575, 15 ] , "outputIndexes": [ 1576 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6444", "inputIndexes": [ 1576 ] , "outputIndexes": [ 1577 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6445", "inputIndexes": [ 12, 1577 ] , "outputIndexes": [ 1578 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6446", "inputIndexes": [ 1578, 1577 ] , "outputIndexes": [ 1579 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_259_output_0", "inputIndexes": [ 1562, 1579, 1565 ] , "outputIndexes": [ 1580 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_545_output_0", "inputIndexes": [ 1580, 20 ] , "outputIndexes": [ 1581 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_221_output_0", "inputIndexes": [ 1573, 1581, 30, 31 ] , "outputIndexes": [ 1582 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_154_output_0", "inputIndexes": [ 1561, 1582 ] , "outputIndexes": [ 1583 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_136_output_0", "inputIndexes": [ 1583, 58 ] , "outputIndexes": [ 1584 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_240_output_0", "inputIndexes": [ 1583 ] , "outputIndexes": [ 1585 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6547", "inputIndexes": [ 1585 ] , "outputIndexes": [ 1586 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6549", "inputIndexes": [ 1585 ] , "outputIndexes": [ 1587 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6551", "inputIndexes": [ 1587, 1587 ] , "outputIndexes": [ 1588 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6552", "inputIndexes": [ 1588 ] , "outputIndexes": [ 1589 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6554", "inputIndexes": [ 1588, 12 ] , "outputIndexes": [ 1590 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6555", "inputIndexes": [ 1590 ] , "outputIndexes": [ 1591 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6558", "inputIndexes": [ 1586, 1589, 1591, 15 ] , "outputIndexes": [ 1592 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6559", "inputIndexes": [ 1592 ] , "outputIndexes": [ 1593 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6560", "inputIndexes": [ 61, 1593 ] , "outputIndexes": [ 1594 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6561", "inputIndexes": [ 1594, 1593 ] , "outputIndexes": [ 1595 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_260_output_0", "inputIndexes": [ 1585, 1595, 1588 ] , "outputIndexes": [ 1596 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_51_output_0", "inputIndexes": [ 1596, 73 ] , "outputIndexes": [ 1597 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_551_output_0", "inputIndexes": [ 1597, 20 ] , "outputIndexes": [ 1598 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_69_output_0", "inputIndexes": [ 1583, 1598, 76, 77, 15 ] , "outputIndexes": [ 1599 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_34_output_0", "inputIndexes": [ 1599 ] , "outputIndexes": [ 1600 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_550_output_0", "inputIndexes": [ 1597, 20 ] , "outputIndexes": [ 1601 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_68_output_0", "inputIndexes": [ 1583, 20, 1601, 77, 15 ] , "outputIndexes": [ 1602 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_224_output_0", "inputIndexes": [ 1600, 1602 ] , "outputIndexes": [ 1603 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_137_output_0", "inputIndexes": [ 1603, 89 ] , "outputIndexes": [ 1604 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_85_output_0", "inputIndexes": [ 1584, 1604 ] , "outputIndexes": [ 1605 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/self_attn/k_proj/Linear", "inputIndexes": [ 3197 ] , "outputIndexes": [ 3202 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 67308240, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3202 ] , "outputIndexes": [ 3203 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3203 ] , "outputIndexes": [ 1606 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_546_output_0", "inputIndexes": [ 1572, 20 ] , "outputIndexes": [ 1607 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_547_output_0", "inputIndexes": [ 1580, 20 ] , "outputIndexes": [ 1608 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_222_output_0", "inputIndexes": [ 1607, 1608, 77, 31 ] , "outputIndexes": [ 1609 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_155_output_0", "inputIndexes": [ 1606, 1609 ] , "outputIndexes": [ 1610 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_138_output_0", "inputIndexes": [ 1610, 58 ] , "outputIndexes": [ 1611 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_241_output_0", "inputIndexes": [ 1610 ] , "outputIndexes": [ 1612 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6453", "inputIndexes": [ 1612 ] , "outputIndexes": [ 1613 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6455", "inputIndexes": [ 1612 ] , "outputIndexes": [ 1614 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6457", "inputIndexes": [ 1614, 1614 ] , "outputIndexes": [ 1615 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6458", "inputIndexes": [ 1615 ] , "outputIndexes": [ 1616 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6460", "inputIndexes": [ 1615, 12 ] , "outputIndexes": [ 1617 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6461", "inputIndexes": [ 1617 ] , "outputIndexes": [ 1618 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6464", "inputIndexes": [ 1613, 1616, 1618, 15 ] , "outputIndexes": [ 1619 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6465", "inputIndexes": [ 1619 ] , "outputIndexes": [ 1620 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6466", "inputIndexes": [ 61, 1620 ] , "outputIndexes": [ 1621 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6467", "inputIndexes": [ 1621, 1620 ] , "outputIndexes": [ 1622 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_261_output_0", "inputIndexes": [ 1612, 1622, 1615 ] , "outputIndexes": [ 1623 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_52_output_0", "inputIndexes": [ 1623, 73 ] , "outputIndexes": [ 1624 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_553_output_0", "inputIndexes": [ 1624, 20 ] , "outputIndexes": [ 1625 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_71_output_0", "inputIndexes": [ 1610, 1625, 76, 77, 15 ] , "outputIndexes": [ 1626 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_35_output_0", "inputIndexes": [ 1626 ] , "outputIndexes": [ 1627 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_552_output_0", "inputIndexes": [ 1624, 20 ] , "outputIndexes": [ 1628 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_70_output_0", "inputIndexes": [ 1610, 20, 1628, 77, 15 ] , "outputIndexes": [ 1629 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_225_output_0", "inputIndexes": [ 1627, 1629 ] , "outputIndexes": [ 1630 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_139_output_0", "inputIndexes": [ 1630, 89 ] , "outputIndexes": [ 1631 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_86_output_0", "inputIndexes": [ 1611, 1631 ] , "outputIndexes": [ 1632 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/self_attn/v_proj/Linear", "inputIndexes": [ 3197 ] , "outputIndexes": [ 3206 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 67432918, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3206 ] , "outputIndexes": [ 3207 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3207 ] , "outputIndexes": [ 1633 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_548_output_0", "inputIndexes": [ 1572, 20 ] , "outputIndexes": [ 1634 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_549_output_0", "inputIndexes": [ 1580, 20 ] , "outputIndexes": [ 1635 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_223_output_0", "inputIndexes": [ 1634, 1635, 77, 31 ] , "outputIndexes": [ 1636 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_156_output_0", "inputIndexes": [ 1633, 1636 ] , "outputIndexes": [ 1637 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_161_output_0", "inputIndexes": [ 1605, 1632, 1637, 124 ] , "outputIndexes": [ 1638 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1638 ] , "outputIndexes": [ 3208 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3208 ] , "outputIndexes": [ 3209 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/self_attn/o_proj/Linear", "inputIndexes": [ 3209 ] , "outputIndexes": [ 3210 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 67557596, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3210 ] , "outputIndexes": [ 3211 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3211 ] , "outputIndexes": [ 1639 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_88_output_0", "inputIndexes": [ 1559, 1639 ] , "outputIndexes": [ 1640 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_17/Mul_1_output_0", "inputIndexes": [ 1640 ] , "outputIndexes": [ 1641 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 67931106, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1641 ] , "outputIndexes": [ 3212 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3212 ] , "outputIndexes": [ 3213 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/mlp/gate_proj/Linear", "inputIndexes": [ 3213 ] , "outputIndexes": [ 3214 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 67935714, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3214 ] , "outputIndexes": [ 3215 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3215 ] , "outputIndexes": [ 1642 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_17/Mul_output_0", "inputIndexes": [ 1642 ] , "outputIndexes": [ 1643 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/mlp/up_proj/Linear", "inputIndexes": [ 3213 ] , "outputIndexes": [ 3218 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 68931304, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3218 ] , "outputIndexes": [ 3219 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3219 ] , "outputIndexes": [ 1644 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_17/Mul_output_0", "inputIndexes": [ 1643, 1644 ] , "outputIndexes": [ 1645 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1645 ] , "outputIndexes": [ 3220 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3220 ] , "outputIndexes": [ 3221 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.17/mlp/down_proj/Linear", "inputIndexes": [ 3221 ] , "outputIndexes": [ 3222 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 69926894, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.17/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3222 ] , "outputIndexes": [ 3223 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3223 ] , "outputIndexes": [ 1646 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_89_output_0", "inputIndexes": [ 1640, 1646 ] , "outputIndexes": [ 1647 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_162_output_0", "inputIndexes": [ 1647, 3 ] , "outputIndexes": [ 1648 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_18/Mul_1_output_0", "inputIndexes": [ 1648 ] , "outputIndexes": [ 1649 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 70867188, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1649 ] , "outputIndexes": [ 3224 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3224 ] , "outputIndexes": [ 3225 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/self_attn/q_proj/Linear", "inputIndexes": [ 3225 ] , "outputIndexes": [ 3226 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 70871796, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3226 ] , "outputIndexes": [ 3227 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3227 ] , "outputIndexes": [ 1650 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_252_output_0", "inputIndexes": [ 1649 ] , "outputIndexes": [ 1651 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6786", "inputIndexes": [ 1651 ] , "outputIndexes": [ 1652 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6788", "inputIndexes": [ 1651 ] , "outputIndexes": [ 1653 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6790", "inputIndexes": [ 1653, 1653 ] , "outputIndexes": [ 1654 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6791", "inputIndexes": [ 1654 ] , "outputIndexes": [ 1655 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6793", "inputIndexes": [ 1654, 12 ] , "outputIndexes": [ 1656 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6794", "inputIndexes": [ 1656 ] , "outputIndexes": [ 1657 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6797", "inputIndexes": [ 1652, 1655, 1657, 15 ] , "outputIndexes": [ 1658 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6798", "inputIndexes": [ 1658 ] , "outputIndexes": [ 1659 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6800", "inputIndexes": [ 1659, 1659 ] , "outputIndexes": [ 1660 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_273_output_0", "inputIndexes": [ 1651, 1660, 1654 ] , "outputIndexes": [ 1661 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_576_output_0", "inputIndexes": [ 1661, 20 ] , "outputIndexes": [ 1662 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6808", "inputIndexes": [ 1654 ] , "outputIndexes": [ 1663 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6811", "inputIndexes": [ 1656 ] , "outputIndexes": [ 1664 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6814", "inputIndexes": [ 1652, 1663, 1664, 15 ] , "outputIndexes": [ 1665 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6815", "inputIndexes": [ 1665 ] , "outputIndexes": [ 1666 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6816", "inputIndexes": [ 12, 1666 ] , "outputIndexes": [ 1667 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6817", "inputIndexes": [ 1667, 1666 ] , "outputIndexes": [ 1668 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_274_output_0", "inputIndexes": [ 1651, 1668, 1654 ] , "outputIndexes": [ 1669 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_577_output_0", "inputIndexes": [ 1669, 20 ] , "outputIndexes": [ 1670 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_234_output_0", "inputIndexes": [ 1662, 1670, 30, 31 ] , "outputIndexes": [ 1671 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_163_output_0", "inputIndexes": [ 1650, 1671 ] , "outputIndexes": [ 1672 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_144_output_0", "inputIndexes": [ 1672, 58 ] , "outputIndexes": [ 1673 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_254_output_0", "inputIndexes": [ 1672 ] , "outputIndexes": [ 1674 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6918", "inputIndexes": [ 1674 ] , "outputIndexes": [ 1675 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6920", "inputIndexes": [ 1674 ] , "outputIndexes": [ 1676 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6922", "inputIndexes": [ 1676, 1676 ] , "outputIndexes": [ 1677 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6923", "inputIndexes": [ 1677 ] , "outputIndexes": [ 1678 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6925", "inputIndexes": [ 1677, 12 ] , "outputIndexes": [ 1679 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6926", "inputIndexes": [ 1679 ] , "outputIndexes": [ 1680 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6929", "inputIndexes": [ 1675, 1678, 1680, 15 ] , "outputIndexes": [ 1681 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6930", "inputIndexes": [ 1681 ] , "outputIndexes": [ 1682 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6931", "inputIndexes": [ 61, 1682 ] , "outputIndexes": [ 1683 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6932", "inputIndexes": [ 1683, 1682 ] , "outputIndexes": [ 1684 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_275_output_0", "inputIndexes": [ 1674, 1684, 1677 ] , "outputIndexes": [ 1685 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_54_output_0", "inputIndexes": [ 1685, 73 ] , "outputIndexes": [ 1686 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_583_output_0", "inputIndexes": [ 1686, 20 ] , "outputIndexes": [ 1687 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_73_output_0", "inputIndexes": [ 1672, 1687, 76, 77, 15 ] , "outputIndexes": [ 1688 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_36_output_0", "inputIndexes": [ 1688 ] , "outputIndexes": [ 1689 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_582_output_0", "inputIndexes": [ 1686, 20 ] , "outputIndexes": [ 1690 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_72_output_0", "inputIndexes": [ 1672, 20, 1690, 77, 15 ] , "outputIndexes": [ 1691 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_237_output_0", "inputIndexes": [ 1689, 1691 ] , "outputIndexes": [ 1692 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_145_output_0", "inputIndexes": [ 1692, 89 ] , "outputIndexes": [ 1693 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_90_output_0", "inputIndexes": [ 1673, 1693 ] , "outputIndexes": [ 1694 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/self_attn/k_proj/Linear", "inputIndexes": [ 3225 ] , "outputIndexes": [ 3230 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 71245306, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3230 ] , "outputIndexes": [ 3231 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3231 ] , "outputIndexes": [ 1695 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_578_output_0", "inputIndexes": [ 1661, 20 ] , "outputIndexes": [ 1696 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_579_output_0", "inputIndexes": [ 1669, 20 ] , "outputIndexes": [ 1697 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_235_output_0", "inputIndexes": [ 1696, 1697, 77, 31 ] , "outputIndexes": [ 1698 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_164_output_0", "inputIndexes": [ 1695, 1698 ] , "outputIndexes": [ 1699 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_146_output_0", "inputIndexes": [ 1699, 58 ] , "outputIndexes": [ 1700 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_255_output_0", "inputIndexes": [ 1699 ] , "outputIndexes": [ 1701 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape6824", "inputIndexes": [ 1701 ] , "outputIndexes": [ 1702 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank6826", "inputIndexes": [ 1701 ] , "outputIndexes": [ 1703 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6828", "inputIndexes": [ 1703, 1703 ] , "outputIndexes": [ 1704 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6829", "inputIndexes": [ 1704 ] , "outputIndexes": [ 1705 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6831", "inputIndexes": [ 1704, 12 ] , "outputIndexes": [ 1706 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze6832", "inputIndexes": [ 1706 ] , "outputIndexes": [ 1707 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice6835", "inputIndexes": [ 1702, 1705, 1707, 15 ] , "outputIndexes": [ 1708 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze6836", "inputIndexes": [ 1708 ] , "outputIndexes": [ 1709 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6837", "inputIndexes": [ 61, 1709 ] , "outputIndexes": [ 1710 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp6838", "inputIndexes": [ 1710, 1709 ] , "outputIndexes": [ 1711 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_276_output_0", "inputIndexes": [ 1701, 1711, 1704 ] , "outputIndexes": [ 1712 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_55_output_0", "inputIndexes": [ 1712, 73 ] , "outputIndexes": [ 1713 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_585_output_0", "inputIndexes": [ 1713, 20 ] , "outputIndexes": [ 1714 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_75_output_0", "inputIndexes": [ 1699, 1714, 76, 77, 15 ] , "outputIndexes": [ 1715 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_37_output_0", "inputIndexes": [ 1715 ] , "outputIndexes": [ 1716 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_584_output_0", "inputIndexes": [ 1713, 20 ] , "outputIndexes": [ 1717 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_74_output_0", "inputIndexes": [ 1699, 20, 1717, 77, 15 ] , "outputIndexes": [ 1718 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_238_output_0", "inputIndexes": [ 1716, 1718 ] , "outputIndexes": [ 1719 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_147_output_0", "inputIndexes": [ 1719, 89 ] , "outputIndexes": [ 1720 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_91_output_0", "inputIndexes": [ 1700, 1720 ] , "outputIndexes": [ 1721 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/self_attn/v_proj/Linear", "inputIndexes": [ 3225 ] , "outputIndexes": [ 3234 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 71369984, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3234 ] , "outputIndexes": [ 3235 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3235 ] , "outputIndexes": [ 1722 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_580_output_0", "inputIndexes": [ 1661, 20 ] , "outputIndexes": [ 1723 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_581_output_0", "inputIndexes": [ 1669, 20 ] , "outputIndexes": [ 1724 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_236_output_0", "inputIndexes": [ 1723, 1724, 77, 31 ] , "outputIndexes": [ 1725 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_165_output_0", "inputIndexes": [ 1722, 1725 ] , "outputIndexes": [ 1726 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_170_output_0", "inputIndexes": [ 1694, 1721, 1726, 124 ] , "outputIndexes": [ 1727 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1727 ] , "outputIndexes": [ 3236 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3236 ] , "outputIndexes": [ 3237 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/self_attn/o_proj/Linear", "inputIndexes": [ 3237 ] , "outputIndexes": [ 3238 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 71494662, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3238 ] , "outputIndexes": [ 3239 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3239 ] , "outputIndexes": [ 1728 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_93_output_0", "inputIndexes": [ 1648, 1728 ] , "outputIndexes": [ 1729 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_18/Mul_1_output_0", "inputIndexes": [ 1729 ] , "outputIndexes": [ 1730 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 71868172, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1730 ] , "outputIndexes": [ 3240 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3240 ] , "outputIndexes": [ 3241 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/mlp/gate_proj/Linear", "inputIndexes": [ 3241 ] , "outputIndexes": [ 3242 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 71872780, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3242 ] , "outputIndexes": [ 3243 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3243 ] , "outputIndexes": [ 1731 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_18/Mul_output_0", "inputIndexes": [ 1731 ] , "outputIndexes": [ 1732 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/mlp/up_proj/Linear", "inputIndexes": [ 3241 ] , "outputIndexes": [ 3246 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 72868370, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3246 ] , "outputIndexes": [ 3247 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3247 ] , "outputIndexes": [ 1733 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_18/Mul_output_0", "inputIndexes": [ 1732, 1733 ] , "outputIndexes": [ 1734 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1734 ] , "outputIndexes": [ 3248 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3248 ] , "outputIndexes": [ 3249 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.18/mlp/down_proj/Linear", "inputIndexes": [ 3249 ] , "outputIndexes": [ 3250 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 73863960, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.18/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3250 ] , "outputIndexes": [ 3251 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3251 ] , "outputIndexes": [ 1735 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_94_output_0", "inputIndexes": [ 1729, 1735 ] , "outputIndexes": [ 1736 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_171_output_0", "inputIndexes": [ 1736, 3 ] , "outputIndexes": [ 1737 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_19/Mul_1_output_0", "inputIndexes": [ 1737 ] , "outputIndexes": [ 1738 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 74804254, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1738 ] , "outputIndexes": [ 3252 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3252 ] , "outputIndexes": [ 3253 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/self_attn/q_proj/Linear", "inputIndexes": [ 3253 ] , "outputIndexes": [ 3254 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 74808862, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3254 ] , "outputIndexes": [ 3255 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3255 ] , "outputIndexes": [ 1739 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_266_output_0", "inputIndexes": [ 1738 ] , "outputIndexes": [ 1740 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7157", "inputIndexes": [ 1740 ] , "outputIndexes": [ 1741 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7159", "inputIndexes": [ 1740 ] , "outputIndexes": [ 1742 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7161", "inputIndexes": [ 1742, 1742 ] , "outputIndexes": [ 1743 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7162", "inputIndexes": [ 1743 ] , "outputIndexes": [ 1744 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7164", "inputIndexes": [ 1743, 12 ] , "outputIndexes": [ 1745 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7165", "inputIndexes": [ 1745 ] , "outputIndexes": [ 1746 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7168", "inputIndexes": [ 1741, 1744, 1746, 15 ] , "outputIndexes": [ 1747 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7169", "inputIndexes": [ 1747 ] , "outputIndexes": [ 1748 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7171", "inputIndexes": [ 1748, 1748 ] , "outputIndexes": [ 1749 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_288_output_0", "inputIndexes": [ 1740, 1749, 1743 ] , "outputIndexes": [ 1750 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_608_output_0", "inputIndexes": [ 1750, 20 ] , "outputIndexes": [ 1751 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7179", "inputIndexes": [ 1743 ] , "outputIndexes": [ 1752 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7182", "inputIndexes": [ 1745 ] , "outputIndexes": [ 1753 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7185", "inputIndexes": [ 1741, 1752, 1753, 15 ] , "outputIndexes": [ 1754 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7186", "inputIndexes": [ 1754 ] , "outputIndexes": [ 1755 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7187", "inputIndexes": [ 12, 1755 ] , "outputIndexes": [ 1756 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7188", "inputIndexes": [ 1756, 1755 ] , "outputIndexes": [ 1757 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_289_output_0", "inputIndexes": [ 1740, 1757, 1743 ] , "outputIndexes": [ 1758 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_609_output_0", "inputIndexes": [ 1758, 20 ] , "outputIndexes": [ 1759 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_247_output_0", "inputIndexes": [ 1751, 1759, 30, 31 ] , "outputIndexes": [ 1760 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_172_output_0", "inputIndexes": [ 1739, 1760 ] , "outputIndexes": [ 1761 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_152_output_0", "inputIndexes": [ 1761, 58 ] , "outputIndexes": [ 1762 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_268_output_0", "inputIndexes": [ 1761 ] , "outputIndexes": [ 1763 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7289", "inputIndexes": [ 1763 ] , "outputIndexes": [ 1764 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7291", "inputIndexes": [ 1763 ] , "outputIndexes": [ 1765 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7293", "inputIndexes": [ 1765, 1765 ] , "outputIndexes": [ 1766 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7294", "inputIndexes": [ 1766 ] , "outputIndexes": [ 1767 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7296", "inputIndexes": [ 1766, 12 ] , "outputIndexes": [ 1768 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7297", "inputIndexes": [ 1768 ] , "outputIndexes": [ 1769 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7300", "inputIndexes": [ 1764, 1767, 1769, 15 ] , "outputIndexes": [ 1770 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7301", "inputIndexes": [ 1770 ] , "outputIndexes": [ 1771 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7302", "inputIndexes": [ 61, 1771 ] , "outputIndexes": [ 1772 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7303", "inputIndexes": [ 1772, 1771 ] , "outputIndexes": [ 1773 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_290_output_0", "inputIndexes": [ 1763, 1773, 1766 ] , "outputIndexes": [ 1774 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_57_output_0", "inputIndexes": [ 1774, 73 ] , "outputIndexes": [ 1775 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_615_output_0", "inputIndexes": [ 1775, 20 ] , "outputIndexes": [ 1776 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_77_output_0", "inputIndexes": [ 1761, 1776, 76, 77, 15 ] , "outputIndexes": [ 1777 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_38_output_0", "inputIndexes": [ 1777 ] , "outputIndexes": [ 1778 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_614_output_0", "inputIndexes": [ 1775, 20 ] , "outputIndexes": [ 1779 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_76_output_0", "inputIndexes": [ 1761, 20, 1779, 77, 15 ] , "outputIndexes": [ 1780 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_250_output_0", "inputIndexes": [ 1778, 1780 ] , "outputIndexes": [ 1781 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_153_output_0", "inputIndexes": [ 1781, 89 ] , "outputIndexes": [ 1782 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_95_output_0", "inputIndexes": [ 1762, 1782 ] , "outputIndexes": [ 1783 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/self_attn/k_proj/Linear", "inputIndexes": [ 3253 ] , "outputIndexes": [ 3258 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75182372, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3258 ] , "outputIndexes": [ 3259 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3259 ] , "outputIndexes": [ 1784 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_610_output_0", "inputIndexes": [ 1750, 20 ] , "outputIndexes": [ 1785 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_611_output_0", "inputIndexes": [ 1758, 20 ] , "outputIndexes": [ 1786 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_248_output_0", "inputIndexes": [ 1785, 1786, 77, 31 ] , "outputIndexes": [ 1787 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_173_output_0", "inputIndexes": [ 1784, 1787 ] , "outputIndexes": [ 1788 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_154_output_0", "inputIndexes": [ 1788, 58 ] , "outputIndexes": [ 1789 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_269_output_0", "inputIndexes": [ 1788 ] , "outputIndexes": [ 1790 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7195", "inputIndexes": [ 1790 ] , "outputIndexes": [ 1791 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7197", "inputIndexes": [ 1790 ] , "outputIndexes": [ 1792 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7199", "inputIndexes": [ 1792, 1792 ] , "outputIndexes": [ 1793 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7200", "inputIndexes": [ 1793 ] , "outputIndexes": [ 1794 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7202", "inputIndexes": [ 1793, 12 ] , "outputIndexes": [ 1795 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7203", "inputIndexes": [ 1795 ] , "outputIndexes": [ 1796 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7206", "inputIndexes": [ 1791, 1794, 1796, 15 ] , "outputIndexes": [ 1797 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7207", "inputIndexes": [ 1797 ] , "outputIndexes": [ 1798 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7208", "inputIndexes": [ 61, 1798 ] , "outputIndexes": [ 1799 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7209", "inputIndexes": [ 1799, 1798 ] , "outputIndexes": [ 1800 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_291_output_0", "inputIndexes": [ 1790, 1800, 1793 ] , "outputIndexes": [ 1801 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_58_output_0", "inputIndexes": [ 1801, 73 ] , "outputIndexes": [ 1802 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_617_output_0", "inputIndexes": [ 1802, 20 ] , "outputIndexes": [ 1803 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_79_output_0", "inputIndexes": [ 1788, 1803, 76, 77, 15 ] , "outputIndexes": [ 1804 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_39_output_0", "inputIndexes": [ 1804 ] , "outputIndexes": [ 1805 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_616_output_0", "inputIndexes": [ 1802, 20 ] , "outputIndexes": [ 1806 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_78_output_0", "inputIndexes": [ 1788, 20, 1806, 77, 15 ] , "outputIndexes": [ 1807 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_251_output_0", "inputIndexes": [ 1805, 1807 ] , "outputIndexes": [ 1808 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_155_output_0", "inputIndexes": [ 1808, 89 ] , "outputIndexes": [ 1809 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_96_output_0", "inputIndexes": [ 1789, 1809 ] , "outputIndexes": [ 1810 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/self_attn/v_proj/Linear", "inputIndexes": [ 3253 ] , "outputIndexes": [ 3262 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75307050, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3262 ] , "outputIndexes": [ 3263 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3263 ] , "outputIndexes": [ 1811 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_612_output_0", "inputIndexes": [ 1750, 20 ] , "outputIndexes": [ 1812 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_613_output_0", "inputIndexes": [ 1758, 20 ] , "outputIndexes": [ 1813 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_249_output_0", "inputIndexes": [ 1812, 1813, 77, 31 ] , "outputIndexes": [ 1814 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_174_output_0", "inputIndexes": [ 1811, 1814 ] , "outputIndexes": [ 1815 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_179_output_0", "inputIndexes": [ 1783, 1810, 1815, 124 ] , "outputIndexes": [ 1816 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1816 ] , "outputIndexes": [ 3264 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3264 ] , "outputIndexes": [ 3265 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/self_attn/o_proj/Linear", "inputIndexes": [ 3265 ] , "outputIndexes": [ 3266 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75431728, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3266 ] , "outputIndexes": [ 3267 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3267 ] , "outputIndexes": [ 1817 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_98_output_0", "inputIndexes": [ 1737, 1817 ] , "outputIndexes": [ 1818 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_19/Mul_1_output_0", "inputIndexes": [ 1818 ] , "outputIndexes": [ 1819 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 75805238, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1819 ] , "outputIndexes": [ 3268 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3268 ] , "outputIndexes": [ 3269 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/mlp/gate_proj/Linear", "inputIndexes": [ 3269 ] , "outputIndexes": [ 3270 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75809846, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3270 ] , "outputIndexes": [ 3271 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3271 ] , "outputIndexes": [ 1820 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_19/Mul_output_0", "inputIndexes": [ 1820 ] , "outputIndexes": [ 1821 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/mlp/up_proj/Linear", "inputIndexes": [ 3269 ] , "outputIndexes": [ 3274 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 76805436, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3274 ] , "outputIndexes": [ 3275 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3275 ] , "outputIndexes": [ 1822 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_19/Mul_output_0", "inputIndexes": [ 1821, 1822 ] , "outputIndexes": [ 1823 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1823 ] , "outputIndexes": [ 3276 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3276 ] , "outputIndexes": [ 3277 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.19/mlp/down_proj/Linear", "inputIndexes": [ 3277 ] , "outputIndexes": [ 3278 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 77801026, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.19/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3278 ] , "outputIndexes": [ 3279 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3279 ] , "outputIndexes": [ 1824 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_99_output_0", "inputIndexes": [ 1818, 1824 ] , "outputIndexes": [ 1825 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_180_output_0", "inputIndexes": [ 1825, 3 ] , "outputIndexes": [ 1826 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_20/Mul_1_output_0", "inputIndexes": [ 1826 ] , "outputIndexes": [ 1827 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 78741320, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1827 ] , "outputIndexes": [ 3280 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3280 ] , "outputIndexes": [ 3281 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/self_attn/q_proj/Linear", "inputIndexes": [ 3281 ] , "outputIndexes": [ 3282 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 78745928, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3282 ] , "outputIndexes": [ 3283 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3283 ] , "outputIndexes": [ 1828 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_280_output_0", "inputIndexes": [ 1827 ] , "outputIndexes": [ 1829 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7528", "inputIndexes": [ 1829 ] , "outputIndexes": [ 1830 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7530", "inputIndexes": [ 1829 ] , "outputIndexes": [ 1831 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7532", "inputIndexes": [ 1831, 1831 ] , "outputIndexes": [ 1832 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7533", "inputIndexes": [ 1832 ] , "outputIndexes": [ 1833 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7535", "inputIndexes": [ 1832, 12 ] , "outputIndexes": [ 1834 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7536", "inputIndexes": [ 1834 ] , "outputIndexes": [ 1835 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7539", "inputIndexes": [ 1830, 1833, 1835, 15 ] , "outputIndexes": [ 1836 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7540", "inputIndexes": [ 1836 ] , "outputIndexes": [ 1837 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7542", "inputIndexes": [ 1837, 1837 ] , "outputIndexes": [ 1838 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_303_output_0", "inputIndexes": [ 1829, 1838, 1832 ] , "outputIndexes": [ 1839 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_640_output_0", "inputIndexes": [ 1839, 20 ] , "outputIndexes": [ 1840 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7550", "inputIndexes": [ 1832 ] , "outputIndexes": [ 1841 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7553", "inputIndexes": [ 1834 ] , "outputIndexes": [ 1842 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7556", "inputIndexes": [ 1830, 1841, 1842, 15 ] , "outputIndexes": [ 1843 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7557", "inputIndexes": [ 1843 ] , "outputIndexes": [ 1844 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7558", "inputIndexes": [ 12, 1844 ] , "outputIndexes": [ 1845 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7559", "inputIndexes": [ 1845, 1844 ] , "outputIndexes": [ 1846 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_304_output_0", "inputIndexes": [ 1829, 1846, 1832 ] , "outputIndexes": [ 1847 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_641_output_0", "inputIndexes": [ 1847, 20 ] , "outputIndexes": [ 1848 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_260_output_0", "inputIndexes": [ 1840, 1848, 30, 31 ] , "outputIndexes": [ 1849 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_181_output_0", "inputIndexes": [ 1828, 1849 ] , "outputIndexes": [ 1850 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_160_output_0", "inputIndexes": [ 1850, 58 ] , "outputIndexes": [ 1851 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_282_output_0", "inputIndexes": [ 1850 ] , "outputIndexes": [ 1852 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7660", "inputIndexes": [ 1852 ] , "outputIndexes": [ 1853 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7662", "inputIndexes": [ 1852 ] , "outputIndexes": [ 1854 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7664", "inputIndexes": [ 1854, 1854 ] , "outputIndexes": [ 1855 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7665", "inputIndexes": [ 1855 ] , "outputIndexes": [ 1856 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7667", "inputIndexes": [ 1855, 12 ] , "outputIndexes": [ 1857 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7668", "inputIndexes": [ 1857 ] , "outputIndexes": [ 1858 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7671", "inputIndexes": [ 1853, 1856, 1858, 15 ] , "outputIndexes": [ 1859 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7672", "inputIndexes": [ 1859 ] , "outputIndexes": [ 1860 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7673", "inputIndexes": [ 61, 1860 ] , "outputIndexes": [ 1861 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7674", "inputIndexes": [ 1861, 1860 ] , "outputIndexes": [ 1862 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_305_output_0", "inputIndexes": [ 1852, 1862, 1855 ] , "outputIndexes": [ 1863 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_60_output_0", "inputIndexes": [ 1863, 73 ] , "outputIndexes": [ 1864 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_647_output_0", "inputIndexes": [ 1864, 20 ] , "outputIndexes": [ 1865 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_81_output_0", "inputIndexes": [ 1850, 1865, 76, 77, 15 ] , "outputIndexes": [ 1866 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_40_output_0", "inputIndexes": [ 1866 ] , "outputIndexes": [ 1867 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_646_output_0", "inputIndexes": [ 1864, 20 ] , "outputIndexes": [ 1868 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_80_output_0", "inputIndexes": [ 1850, 20, 1868, 77, 15 ] , "outputIndexes": [ 1869 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_263_output_0", "inputIndexes": [ 1867, 1869 ] , "outputIndexes": [ 1870 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_161_output_0", "inputIndexes": [ 1870, 89 ] , "outputIndexes": [ 1871 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_100_output_0", "inputIndexes": [ 1851, 1871 ] , "outputIndexes": [ 1872 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/self_attn/k_proj/Linear", "inputIndexes": [ 3281 ] , "outputIndexes": [ 3286 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 79119438, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3286 ] , "outputIndexes": [ 3287 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3287 ] , "outputIndexes": [ 1873 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_642_output_0", "inputIndexes": [ 1839, 20 ] , "outputIndexes": [ 1874 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_643_output_0", "inputIndexes": [ 1847, 20 ] , "outputIndexes": [ 1875 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_261_output_0", "inputIndexes": [ 1874, 1875, 77, 31 ] , "outputIndexes": [ 1876 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_182_output_0", "inputIndexes": [ 1873, 1876 ] , "outputIndexes": [ 1877 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_162_output_0", "inputIndexes": [ 1877, 58 ] , "outputIndexes": [ 1878 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_283_output_0", "inputIndexes": [ 1877 ] , "outputIndexes": [ 1879 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7566", "inputIndexes": [ 1879 ] , "outputIndexes": [ 1880 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7568", "inputIndexes": [ 1879 ] , "outputIndexes": [ 1881 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7570", "inputIndexes": [ 1881, 1881 ] , "outputIndexes": [ 1882 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7571", "inputIndexes": [ 1882 ] , "outputIndexes": [ 1883 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7573", "inputIndexes": [ 1882, 12 ] , "outputIndexes": [ 1884 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7574", "inputIndexes": [ 1884 ] , "outputIndexes": [ 1885 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7577", "inputIndexes": [ 1880, 1883, 1885, 15 ] , "outputIndexes": [ 1886 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7578", "inputIndexes": [ 1886 ] , "outputIndexes": [ 1887 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7579", "inputIndexes": [ 61, 1887 ] , "outputIndexes": [ 1888 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7580", "inputIndexes": [ 1888, 1887 ] , "outputIndexes": [ 1889 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_306_output_0", "inputIndexes": [ 1879, 1889, 1882 ] , "outputIndexes": [ 1890 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_61_output_0", "inputIndexes": [ 1890, 73 ] , "outputIndexes": [ 1891 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_649_output_0", "inputIndexes": [ 1891, 20 ] , "outputIndexes": [ 1892 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_83_output_0", "inputIndexes": [ 1877, 1892, 76, 77, 15 ] , "outputIndexes": [ 1893 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_41_output_0", "inputIndexes": [ 1893 ] , "outputIndexes": [ 1894 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_648_output_0", "inputIndexes": [ 1891, 20 ] , "outputIndexes": [ 1895 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_82_output_0", "inputIndexes": [ 1877, 20, 1895, 77, 15 ] , "outputIndexes": [ 1896 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_264_output_0", "inputIndexes": [ 1894, 1896 ] , "outputIndexes": [ 1897 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_163_output_0", "inputIndexes": [ 1897, 89 ] , "outputIndexes": [ 1898 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_101_output_0", "inputIndexes": [ 1878, 1898 ] , "outputIndexes": [ 1899 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/self_attn/v_proj/Linear", "inputIndexes": [ 3281 ] , "outputIndexes": [ 3290 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 79244116, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3290 ] , "outputIndexes": [ 3291 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3291 ] , "outputIndexes": [ 1900 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_644_output_0", "inputIndexes": [ 1839, 20 ] , "outputIndexes": [ 1901 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_645_output_0", "inputIndexes": [ 1847, 20 ] , "outputIndexes": [ 1902 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_262_output_0", "inputIndexes": [ 1901, 1902, 77, 31 ] , "outputIndexes": [ 1903 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_183_output_0", "inputIndexes": [ 1900, 1903 ] , "outputIndexes": [ 1904 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_188_output_0", "inputIndexes": [ 1872, 1899, 1904, 124 ] , "outputIndexes": [ 1905 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1905 ] , "outputIndexes": [ 3292 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3292 ] , "outputIndexes": [ 3293 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/self_attn/o_proj/Linear", "inputIndexes": [ 3293 ] , "outputIndexes": [ 3294 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 79368794, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3294 ] , "outputIndexes": [ 3295 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3295 ] , "outputIndexes": [ 1906 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_103_output_0", "inputIndexes": [ 1826, 1906 ] , "outputIndexes": [ 1907 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_20/Mul_1_output_0", "inputIndexes": [ 1907 ] , "outputIndexes": [ 1908 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 79742304, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1908 ] , "outputIndexes": [ 3296 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3296 ] , "outputIndexes": [ 3297 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/mlp/gate_proj/Linear", "inputIndexes": [ 3297 ] , "outputIndexes": [ 3298 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 79746912, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3298 ] , "outputIndexes": [ 3299 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3299 ] , "outputIndexes": [ 1909 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_20/Mul_output_0", "inputIndexes": [ 1909 ] , "outputIndexes": [ 1910 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/mlp/up_proj/Linear", "inputIndexes": [ 3297 ] , "outputIndexes": [ 3302 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 80742502, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3302 ] , "outputIndexes": [ 3303 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3303 ] , "outputIndexes": [ 1911 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_20/Mul_output_0", "inputIndexes": [ 1910, 1911 ] , "outputIndexes": [ 1912 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 1912 ] , "outputIndexes": [ 3304 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3304 ] , "outputIndexes": [ 3305 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.20/mlp/down_proj/Linear", "inputIndexes": [ 3305 ] , "outputIndexes": [ 3306 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 81738092, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.20/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3306 ] , "outputIndexes": [ 3307 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3307 ] , "outputIndexes": [ 1913 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_104_output_0", "inputIndexes": [ 1907, 1913 ] , "outputIndexes": [ 1914 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_189_output_0", "inputIndexes": [ 1914, 3 ] , "outputIndexes": [ 1915 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_21/Mul_1_output_0", "inputIndexes": [ 1915 ] , "outputIndexes": [ 1916 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 82678386, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 1916 ] , "outputIndexes": [ 3308 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3308 ] , "outputIndexes": [ 3309 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/self_attn/q_proj/Linear", "inputIndexes": [ 3309 ] , "outputIndexes": [ 3310 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 82682994, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3310 ] , "outputIndexes": [ 3311 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3311 ] , "outputIndexes": [ 1917 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_294_output_0", "inputIndexes": [ 1916 ] , "outputIndexes": [ 1918 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7899", "inputIndexes": [ 1918 ] , "outputIndexes": [ 1919 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7901", "inputIndexes": [ 1918 ] , "outputIndexes": [ 1920 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7903", "inputIndexes": [ 1920, 1920 ] , "outputIndexes": [ 1921 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7904", "inputIndexes": [ 1921 ] , "outputIndexes": [ 1922 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7906", "inputIndexes": [ 1921, 12 ] , "outputIndexes": [ 1923 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7907", "inputIndexes": [ 1923 ] , "outputIndexes": [ 1924 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7910", "inputIndexes": [ 1919, 1922, 1924, 15 ] , "outputIndexes": [ 1925 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7911", "inputIndexes": [ 1925 ] , "outputIndexes": [ 1926 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7913", "inputIndexes": [ 1926, 1926 ] , "outputIndexes": [ 1927 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_318_output_0", "inputIndexes": [ 1918, 1927, 1921 ] , "outputIndexes": [ 1928 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_672_output_0", "inputIndexes": [ 1928, 20 ] , "outputIndexes": [ 1929 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7921", "inputIndexes": [ 1921 ] , "outputIndexes": [ 1930 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7924", "inputIndexes": [ 1923 ] , "outputIndexes": [ 1931 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7927", "inputIndexes": [ 1919, 1930, 1931, 15 ] , "outputIndexes": [ 1932 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7928", "inputIndexes": [ 1932 ] , "outputIndexes": [ 1933 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7929", "inputIndexes": [ 12, 1933 ] , "outputIndexes": [ 1934 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7930", "inputIndexes": [ 1934, 1933 ] , "outputIndexes": [ 1935 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_319_output_0", "inputIndexes": [ 1918, 1935, 1921 ] , "outputIndexes": [ 1936 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_673_output_0", "inputIndexes": [ 1936, 20 ] , "outputIndexes": [ 1937 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_273_output_0", "inputIndexes": [ 1929, 1937, 30, 31 ] , "outputIndexes": [ 1938 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_190_output_0", "inputIndexes": [ 1917, 1938 ] , "outputIndexes": [ 1939 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_168_output_0", "inputIndexes": [ 1939, 58 ] , "outputIndexes": [ 1940 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_296_output_0", "inputIndexes": [ 1939 ] , "outputIndexes": [ 1941 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8031", "inputIndexes": [ 1941 ] , "outputIndexes": [ 1942 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8033", "inputIndexes": [ 1941 ] , "outputIndexes": [ 1943 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8035", "inputIndexes": [ 1943, 1943 ] , "outputIndexes": [ 1944 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8036", "inputIndexes": [ 1944 ] , "outputIndexes": [ 1945 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8038", "inputIndexes": [ 1944, 12 ] , "outputIndexes": [ 1946 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8039", "inputIndexes": [ 1946 ] , "outputIndexes": [ 1947 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8042", "inputIndexes": [ 1942, 1945, 1947, 15 ] , "outputIndexes": [ 1948 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8043", "inputIndexes": [ 1948 ] , "outputIndexes": [ 1949 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8044", "inputIndexes": [ 61, 1949 ] , "outputIndexes": [ 1950 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8045", "inputIndexes": [ 1950, 1949 ] , "outputIndexes": [ 1951 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_320_output_0", "inputIndexes": [ 1941, 1951, 1944 ] , "outputIndexes": [ 1952 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_63_output_0", "inputIndexes": [ 1952, 73 ] , "outputIndexes": [ 1953 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_679_output_0", "inputIndexes": [ 1953, 20 ] , "outputIndexes": [ 1954 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_85_output_0", "inputIndexes": [ 1939, 1954, 76, 77, 15 ] , "outputIndexes": [ 1955 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_42_output_0", "inputIndexes": [ 1955 ] , "outputIndexes": [ 1956 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_678_output_0", "inputIndexes": [ 1953, 20 ] , "outputIndexes": [ 1957 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_84_output_0", "inputIndexes": [ 1939, 20, 1957, 77, 15 ] , "outputIndexes": [ 1958 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_276_output_0", "inputIndexes": [ 1956, 1958 ] , "outputIndexes": [ 1959 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_169_output_0", "inputIndexes": [ 1959, 89 ] , "outputIndexes": [ 1960 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_105_output_0", "inputIndexes": [ 1940, 1960 ] , "outputIndexes": [ 1961 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/self_attn/k_proj/Linear", "inputIndexes": [ 3309 ] , "outputIndexes": [ 3314 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 83056504, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3314 ] , "outputIndexes": [ 3315 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3315 ] , "outputIndexes": [ 1962 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_674_output_0", "inputIndexes": [ 1928, 20 ] , "outputIndexes": [ 1963 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_675_output_0", "inputIndexes": [ 1936, 20 ] , "outputIndexes": [ 1964 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_274_output_0", "inputIndexes": [ 1963, 1964, 77, 31 ] , "outputIndexes": [ 1965 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_191_output_0", "inputIndexes": [ 1962, 1965 ] , "outputIndexes": [ 1966 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_170_output_0", "inputIndexes": [ 1966, 58 ] , "outputIndexes": [ 1967 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_297_output_0", "inputIndexes": [ 1966 ] , "outputIndexes": [ 1968 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape7937", "inputIndexes": [ 1968 ] , "outputIndexes": [ 1969 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank7939", "inputIndexes": [ 1968 ] , "outputIndexes": [ 1970 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7941", "inputIndexes": [ 1970, 1970 ] , "outputIndexes": [ 1971 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7942", "inputIndexes": [ 1971 ] , "outputIndexes": [ 1972 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7944", "inputIndexes": [ 1971, 12 ] , "outputIndexes": [ 1973 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze7945", "inputIndexes": [ 1973 ] , "outputIndexes": [ 1974 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice7948", "inputIndexes": [ 1969, 1972, 1974, 15 ] , "outputIndexes": [ 1975 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze7949", "inputIndexes": [ 1975 ] , "outputIndexes": [ 1976 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7950", "inputIndexes": [ 61, 1976 ] , "outputIndexes": [ 1977 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp7951", "inputIndexes": [ 1977, 1976 ] , "outputIndexes": [ 1978 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_321_output_0", "inputIndexes": [ 1968, 1978, 1971 ] , "outputIndexes": [ 1979 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_64_output_0", "inputIndexes": [ 1979, 73 ] , "outputIndexes": [ 1980 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_681_output_0", "inputIndexes": [ 1980, 20 ] , "outputIndexes": [ 1981 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_87_output_0", "inputIndexes": [ 1966, 1981, 76, 77, 15 ] , "outputIndexes": [ 1982 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_43_output_0", "inputIndexes": [ 1982 ] , "outputIndexes": [ 1983 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_680_output_0", "inputIndexes": [ 1980, 20 ] , "outputIndexes": [ 1984 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_86_output_0", "inputIndexes": [ 1966, 20, 1984, 77, 15 ] , "outputIndexes": [ 1985 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_277_output_0", "inputIndexes": [ 1983, 1985 ] , "outputIndexes": [ 1986 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_171_output_0", "inputIndexes": [ 1986, 89 ] , "outputIndexes": [ 1987 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_106_output_0", "inputIndexes": [ 1967, 1987 ] , "outputIndexes": [ 1988 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/self_attn/v_proj/Linear", "inputIndexes": [ 3309 ] , "outputIndexes": [ 3318 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 83181182, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3318 ] , "outputIndexes": [ 3319 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3319 ] , "outputIndexes": [ 1989 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_676_output_0", "inputIndexes": [ 1928, 20 ] , "outputIndexes": [ 1990 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_677_output_0", "inputIndexes": [ 1936, 20 ] , "outputIndexes": [ 1991 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_275_output_0", "inputIndexes": [ 1990, 1991, 77, 31 ] , "outputIndexes": [ 1992 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_192_output_0", "inputIndexes": [ 1989, 1992 ] , "outputIndexes": [ 1993 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_197_output_0", "inputIndexes": [ 1961, 1988, 1993, 124 ] , "outputIndexes": [ 1994 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 1994 ] , "outputIndexes": [ 3320 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3320 ] , "outputIndexes": [ 3321 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/self_attn/o_proj/Linear", "inputIndexes": [ 3321 ] , "outputIndexes": [ 3322 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 83305860, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3322 ] , "outputIndexes": [ 3323 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3323 ] , "outputIndexes": [ 1995 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_108_output_0", "inputIndexes": [ 1915, 1995 ] , "outputIndexes": [ 1996 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_21/Mul_1_output_0", "inputIndexes": [ 1996 ] , "outputIndexes": [ 1997 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 83679370, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 1997 ] , "outputIndexes": [ 3324 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3324 ] , "outputIndexes": [ 3325 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/mlp/gate_proj/Linear", "inputIndexes": [ 3325 ] , "outputIndexes": [ 3326 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 83683978, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3326 ] , "outputIndexes": [ 3327 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3327 ] , "outputIndexes": [ 1998 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_21/Mul_output_0", "inputIndexes": [ 1998 ] , "outputIndexes": [ 1999 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/mlp/up_proj/Linear", "inputIndexes": [ 3325 ] , "outputIndexes": [ 3330 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 84679568, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3330 ] , "outputIndexes": [ 3331 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3331 ] , "outputIndexes": [ 2000 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_21/Mul_output_0", "inputIndexes": [ 1999, 2000 ] , "outputIndexes": [ 2001 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2001 ] , "outputIndexes": [ 3332 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3332 ] , "outputIndexes": [ 3333 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.21/mlp/down_proj/Linear", "inputIndexes": [ 3333 ] , "outputIndexes": [ 3334 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 85675158, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.21/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3334 ] , "outputIndexes": [ 3335 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3335 ] , "outputIndexes": [ 2002 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_109_output_0", "inputIndexes": [ 1996, 2002 ] , "outputIndexes": [ 2003 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_198_output_0", "inputIndexes": [ 2003, 3 ] , "outputIndexes": [ 2004 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_22/Mul_1_output_0", "inputIndexes": [ 2004 ] , "outputIndexes": [ 2005 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 86615452, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2005 ] , "outputIndexes": [ 3336 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3336 ] , "outputIndexes": [ 3337 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/self_attn/q_proj/Linear", "inputIndexes": [ 3337 ] , "outputIndexes": [ 3338 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 86620060, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3338 ] , "outputIndexes": [ 3339 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3339 ] , "outputIndexes": [ 2006 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_308_output_0", "inputIndexes": [ 2005 ] , "outputIndexes": [ 2007 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8270", "inputIndexes": [ 2007 ] , "outputIndexes": [ 2008 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8272", "inputIndexes": [ 2007 ] , "outputIndexes": [ 2009 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8274", "inputIndexes": [ 2009, 2009 ] , "outputIndexes": [ 2010 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8275", "inputIndexes": [ 2010 ] , "outputIndexes": [ 2011 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8277", "inputIndexes": [ 2010, 12 ] , "outputIndexes": [ 2012 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8278", "inputIndexes": [ 2012 ] , "outputIndexes": [ 2013 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8281", "inputIndexes": [ 2008, 2011, 2013, 15 ] , "outputIndexes": [ 2014 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8282", "inputIndexes": [ 2014 ] , "outputIndexes": [ 2015 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8284", "inputIndexes": [ 2015, 2015 ] , "outputIndexes": [ 2016 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_333_output_0", "inputIndexes": [ 2007, 2016, 2010 ] , "outputIndexes": [ 2017 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_704_output_0", "inputIndexes": [ 2017, 20 ] , "outputIndexes": [ 2018 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8292", "inputIndexes": [ 2010 ] , "outputIndexes": [ 2019 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8295", "inputIndexes": [ 2012 ] , "outputIndexes": [ 2020 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8298", "inputIndexes": [ 2008, 2019, 2020, 15 ] , "outputIndexes": [ 2021 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8299", "inputIndexes": [ 2021 ] , "outputIndexes": [ 2022 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8300", "inputIndexes": [ 12, 2022 ] , "outputIndexes": [ 2023 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8301", "inputIndexes": [ 2023, 2022 ] , "outputIndexes": [ 2024 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_334_output_0", "inputIndexes": [ 2007, 2024, 2010 ] , "outputIndexes": [ 2025 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_705_output_0", "inputIndexes": [ 2025, 20 ] , "outputIndexes": [ 2026 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_286_output_0", "inputIndexes": [ 2018, 2026, 30, 31 ] , "outputIndexes": [ 2027 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_199_output_0", "inputIndexes": [ 2006, 2027 ] , "outputIndexes": [ 2028 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_176_output_0", "inputIndexes": [ 2028, 58 ] , "outputIndexes": [ 2029 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_310_output_0", "inputIndexes": [ 2028 ] , "outputIndexes": [ 2030 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8402", "inputIndexes": [ 2030 ] , "outputIndexes": [ 2031 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8404", "inputIndexes": [ 2030 ] , "outputIndexes": [ 2032 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8406", "inputIndexes": [ 2032, 2032 ] , "outputIndexes": [ 2033 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8407", "inputIndexes": [ 2033 ] , "outputIndexes": [ 2034 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8409", "inputIndexes": [ 2033, 12 ] , "outputIndexes": [ 2035 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8410", "inputIndexes": [ 2035 ] , "outputIndexes": [ 2036 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8413", "inputIndexes": [ 2031, 2034, 2036, 15 ] , "outputIndexes": [ 2037 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8414", "inputIndexes": [ 2037 ] , "outputIndexes": [ 2038 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8415", "inputIndexes": [ 61, 2038 ] , "outputIndexes": [ 2039 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8416", "inputIndexes": [ 2039, 2038 ] , "outputIndexes": [ 2040 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_335_output_0", "inputIndexes": [ 2030, 2040, 2033 ] , "outputIndexes": [ 2041 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_66_output_0", "inputIndexes": [ 2041, 73 ] , "outputIndexes": [ 2042 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_711_output_0", "inputIndexes": [ 2042, 20 ] , "outputIndexes": [ 2043 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_89_output_0", "inputIndexes": [ 2028, 2043, 76, 77, 15 ] , "outputIndexes": [ 2044 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_44_output_0", "inputIndexes": [ 2044 ] , "outputIndexes": [ 2045 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_710_output_0", "inputIndexes": [ 2042, 20 ] , "outputIndexes": [ 2046 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_88_output_0", "inputIndexes": [ 2028, 20, 2046, 77, 15 ] , "outputIndexes": [ 2047 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_289_output_0", "inputIndexes": [ 2045, 2047 ] , "outputIndexes": [ 2048 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_177_output_0", "inputIndexes": [ 2048, 89 ] , "outputIndexes": [ 2049 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_110_output_0", "inputIndexes": [ 2029, 2049 ] , "outputIndexes": [ 2050 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/self_attn/k_proj/Linear", "inputIndexes": [ 3337 ] , "outputIndexes": [ 3342 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 86993570, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3342 ] , "outputIndexes": [ 3343 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3343 ] , "outputIndexes": [ 2051 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_706_output_0", "inputIndexes": [ 2017, 20 ] , "outputIndexes": [ 2052 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_707_output_0", "inputIndexes": [ 2025, 20 ] , "outputIndexes": [ 2053 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_287_output_0", "inputIndexes": [ 2052, 2053, 77, 31 ] , "outputIndexes": [ 2054 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_200_output_0", "inputIndexes": [ 2051, 2054 ] , "outputIndexes": [ 2055 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_178_output_0", "inputIndexes": [ 2055, 58 ] , "outputIndexes": [ 2056 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_311_output_0", "inputIndexes": [ 2055 ] , "outputIndexes": [ 2057 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8308", "inputIndexes": [ 2057 ] , "outputIndexes": [ 2058 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8310", "inputIndexes": [ 2057 ] , "outputIndexes": [ 2059 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8312", "inputIndexes": [ 2059, 2059 ] , "outputIndexes": [ 2060 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8313", "inputIndexes": [ 2060 ] , "outputIndexes": [ 2061 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8315", "inputIndexes": [ 2060, 12 ] , "outputIndexes": [ 2062 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8316", "inputIndexes": [ 2062 ] , "outputIndexes": [ 2063 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8319", "inputIndexes": [ 2058, 2061, 2063, 15 ] , "outputIndexes": [ 2064 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8320", "inputIndexes": [ 2064 ] , "outputIndexes": [ 2065 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8321", "inputIndexes": [ 61, 2065 ] , "outputIndexes": [ 2066 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8322", "inputIndexes": [ 2066, 2065 ] , "outputIndexes": [ 2067 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_336_output_0", "inputIndexes": [ 2057, 2067, 2060 ] , "outputIndexes": [ 2068 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_67_output_0", "inputIndexes": [ 2068, 73 ] , "outputIndexes": [ 2069 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_713_output_0", "inputIndexes": [ 2069, 20 ] , "outputIndexes": [ 2070 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_91_output_0", "inputIndexes": [ 2055, 2070, 76, 77, 15 ] , "outputIndexes": [ 2071 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_45_output_0", "inputIndexes": [ 2071 ] , "outputIndexes": [ 2072 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_712_output_0", "inputIndexes": [ 2069, 20 ] , "outputIndexes": [ 2073 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_90_output_0", "inputIndexes": [ 2055, 20, 2073, 77, 15 ] , "outputIndexes": [ 2074 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_290_output_0", "inputIndexes": [ 2072, 2074 ] , "outputIndexes": [ 2075 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_179_output_0", "inputIndexes": [ 2075, 89 ] , "outputIndexes": [ 2076 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_111_output_0", "inputIndexes": [ 2056, 2076 ] , "outputIndexes": [ 2077 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/self_attn/v_proj/Linear", "inputIndexes": [ 3337 ] , "outputIndexes": [ 3346 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 87118248, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3346 ] , "outputIndexes": [ 3347 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3347 ] , "outputIndexes": [ 2078 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_708_output_0", "inputIndexes": [ 2017, 20 ] , "outputIndexes": [ 2079 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_709_output_0", "inputIndexes": [ 2025, 20 ] , "outputIndexes": [ 2080 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_288_output_0", "inputIndexes": [ 2079, 2080, 77, 31 ] , "outputIndexes": [ 2081 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_201_output_0", "inputIndexes": [ 2078, 2081 ] , "outputIndexes": [ 2082 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_206_output_0", "inputIndexes": [ 2050, 2077, 2082, 124 ] , "outputIndexes": [ 2083 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2083 ] , "outputIndexes": [ 3348 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3348 ] , "outputIndexes": [ 3349 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/self_attn/o_proj/Linear", "inputIndexes": [ 3349 ] , "outputIndexes": [ 3350 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 87242926, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3350 ] , "outputIndexes": [ 3351 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3351 ] , "outputIndexes": [ 2084 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_113_output_0", "inputIndexes": [ 2004, 2084 ] , "outputIndexes": [ 2085 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_22/Mul_1_output_0", "inputIndexes": [ 2085 ] , "outputIndexes": [ 2086 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 87616436, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2086 ] , "outputIndexes": [ 3352 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3352 ] , "outputIndexes": [ 3353 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/mlp/gate_proj/Linear", "inputIndexes": [ 3353 ] , "outputIndexes": [ 3354 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 87621044, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3354 ] , "outputIndexes": [ 3355 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3355 ] , "outputIndexes": [ 2087 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_22/Mul_output_0", "inputIndexes": [ 2087 ] , "outputIndexes": [ 2088 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/mlp/up_proj/Linear", "inputIndexes": [ 3353 ] , "outputIndexes": [ 3358 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 88616634, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3358 ] , "outputIndexes": [ 3359 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3359 ] , "outputIndexes": [ 2089 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_22/Mul_output_0", "inputIndexes": [ 2088, 2089 ] , "outputIndexes": [ 2090 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2090 ] , "outputIndexes": [ 3360 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3360 ] , "outputIndexes": [ 3361 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.22/mlp/down_proj/Linear", "inputIndexes": [ 3361 ] , "outputIndexes": [ 3362 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 89612224, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.22/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3362 ] , "outputIndexes": [ 3363 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3363 ] , "outputIndexes": [ 2091 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_114_output_0", "inputIndexes": [ 2085, 2091 ] , "outputIndexes": [ 2092 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_207_output_0", "inputIndexes": [ 2092, 3 ] , "outputIndexes": [ 2093 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_23/Mul_1_output_0", "inputIndexes": [ 2093 ] , "outputIndexes": [ 2094 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 90552518, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2094 ] , "outputIndexes": [ 3364 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3364 ] , "outputIndexes": [ 3365 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/self_attn/q_proj/Linear", "inputIndexes": [ 3365 ] , "outputIndexes": [ 3366 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 90557126, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3366 ] , "outputIndexes": [ 3367 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3367 ] , "outputIndexes": [ 2095 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_322_output_0", "inputIndexes": [ 2094 ] , "outputIndexes": [ 2096 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8641", "inputIndexes": [ 2096 ] , "outputIndexes": [ 2097 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8643", "inputIndexes": [ 2096 ] , "outputIndexes": [ 2098 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8645", "inputIndexes": [ 2098, 2098 ] , "outputIndexes": [ 2099 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8646", "inputIndexes": [ 2099 ] , "outputIndexes": [ 2100 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8648", "inputIndexes": [ 2099, 12 ] , "outputIndexes": [ 2101 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8649", "inputIndexes": [ 2101 ] , "outputIndexes": [ 2102 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8652", "inputIndexes": [ 2097, 2100, 2102, 15 ] , "outputIndexes": [ 2103 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8653", "inputIndexes": [ 2103 ] , "outputIndexes": [ 2104 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8655", "inputIndexes": [ 2104, 2104 ] , "outputIndexes": [ 2105 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_348_output_0", "inputIndexes": [ 2096, 2105, 2099 ] , "outputIndexes": [ 2106 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_736_output_0", "inputIndexes": [ 2106, 20 ] , "outputIndexes": [ 2107 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8663", "inputIndexes": [ 2099 ] , "outputIndexes": [ 2108 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8666", "inputIndexes": [ 2101 ] , "outputIndexes": [ 2109 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8669", "inputIndexes": [ 2097, 2108, 2109, 15 ] , "outputIndexes": [ 2110 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8670", "inputIndexes": [ 2110 ] , "outputIndexes": [ 2111 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8671", "inputIndexes": [ 12, 2111 ] , "outputIndexes": [ 2112 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8672", "inputIndexes": [ 2112, 2111 ] , "outputIndexes": [ 2113 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_349_output_0", "inputIndexes": [ 2096, 2113, 2099 ] , "outputIndexes": [ 2114 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_737_output_0", "inputIndexes": [ 2114, 20 ] , "outputIndexes": [ 2115 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_299_output_0", "inputIndexes": [ 2107, 2115, 30, 31 ] , "outputIndexes": [ 2116 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_208_output_0", "inputIndexes": [ 2095, 2116 ] , "outputIndexes": [ 2117 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_184_output_0", "inputIndexes": [ 2117, 58 ] , "outputIndexes": [ 2118 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_324_output_0", "inputIndexes": [ 2117 ] , "outputIndexes": [ 2119 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8773", "inputIndexes": [ 2119 ] , "outputIndexes": [ 2120 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8775", "inputIndexes": [ 2119 ] , "outputIndexes": [ 2121 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8777", "inputIndexes": [ 2121, 2121 ] , "outputIndexes": [ 2122 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8778", "inputIndexes": [ 2122 ] , "outputIndexes": [ 2123 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8780", "inputIndexes": [ 2122, 12 ] , "outputIndexes": [ 2124 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8781", "inputIndexes": [ 2124 ] , "outputIndexes": [ 2125 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8784", "inputIndexes": [ 2120, 2123, 2125, 15 ] , "outputIndexes": [ 2126 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8785", "inputIndexes": [ 2126 ] , "outputIndexes": [ 2127 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8786", "inputIndexes": [ 61, 2127 ] , "outputIndexes": [ 2128 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8787", "inputIndexes": [ 2128, 2127 ] , "outputIndexes": [ 2129 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_350_output_0", "inputIndexes": [ 2119, 2129, 2122 ] , "outputIndexes": [ 2130 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_69_output_0", "inputIndexes": [ 2130, 73 ] , "outputIndexes": [ 2131 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_743_output_0", "inputIndexes": [ 2131, 20 ] , "outputIndexes": [ 2132 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_93_output_0", "inputIndexes": [ 2117, 2132, 76, 77, 15 ] , "outputIndexes": [ 2133 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_46_output_0", "inputIndexes": [ 2133 ] , "outputIndexes": [ 2134 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_742_output_0", "inputIndexes": [ 2131, 20 ] , "outputIndexes": [ 2135 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_92_output_0", "inputIndexes": [ 2117, 20, 2135, 77, 15 ] , "outputIndexes": [ 2136 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_302_output_0", "inputIndexes": [ 2134, 2136 ] , "outputIndexes": [ 2137 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_185_output_0", "inputIndexes": [ 2137, 89 ] , "outputIndexes": [ 2138 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_115_output_0", "inputIndexes": [ 2118, 2138 ] , "outputIndexes": [ 2139 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/self_attn/k_proj/Linear", "inputIndexes": [ 3365 ] , "outputIndexes": [ 3370 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 90930636, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3370 ] , "outputIndexes": [ 3371 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3371 ] , "outputIndexes": [ 2140 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_738_output_0", "inputIndexes": [ 2106, 20 ] , "outputIndexes": [ 2141 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_739_output_0", "inputIndexes": [ 2114, 20 ] , "outputIndexes": [ 2142 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_300_output_0", "inputIndexes": [ 2141, 2142, 77, 31 ] , "outputIndexes": [ 2143 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_209_output_0", "inputIndexes": [ 2140, 2143 ] , "outputIndexes": [ 2144 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_186_output_0", "inputIndexes": [ 2144, 58 ] , "outputIndexes": [ 2145 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_325_output_0", "inputIndexes": [ 2144 ] , "outputIndexes": [ 2146 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape8679", "inputIndexes": [ 2146 ] , "outputIndexes": [ 2147 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank8681", "inputIndexes": [ 2146 ] , "outputIndexes": [ 2148 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8683", "inputIndexes": [ 2148, 2148 ] , "outputIndexes": [ 2149 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8684", "inputIndexes": [ 2149 ] , "outputIndexes": [ 2150 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8686", "inputIndexes": [ 2149, 12 ] , "outputIndexes": [ 2151 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze8687", "inputIndexes": [ 2151 ] , "outputIndexes": [ 2152 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice8690", "inputIndexes": [ 2147, 2150, 2152, 15 ] , "outputIndexes": [ 2153 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze8691", "inputIndexes": [ 2153 ] , "outputIndexes": [ 2154 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8692", "inputIndexes": [ 61, 2154 ] , "outputIndexes": [ 2155 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp8693", "inputIndexes": [ 2155, 2154 ] , "outputIndexes": [ 2156 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_351_output_0", "inputIndexes": [ 2146, 2156, 2149 ] , "outputIndexes": [ 2157 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_70_output_0", "inputIndexes": [ 2157, 73 ] , "outputIndexes": [ 2158 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_745_output_0", "inputIndexes": [ 2158, 20 ] , "outputIndexes": [ 2159 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_95_output_0", "inputIndexes": [ 2144, 2159, 76, 77, 15 ] , "outputIndexes": [ 2160 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_47_output_0", "inputIndexes": [ 2160 ] , "outputIndexes": [ 2161 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_744_output_0", "inputIndexes": [ 2158, 20 ] , "outputIndexes": [ 2162 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_94_output_0", "inputIndexes": [ 2144, 20, 2162, 77, 15 ] , "outputIndexes": [ 2163 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_303_output_0", "inputIndexes": [ 2161, 2163 ] , "outputIndexes": [ 2164 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_187_output_0", "inputIndexes": [ 2164, 89 ] , "outputIndexes": [ 2165 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_116_output_0", "inputIndexes": [ 2145, 2165 ] , "outputIndexes": [ 2166 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/self_attn/v_proj/Linear", "inputIndexes": [ 3365 ] , "outputIndexes": [ 3374 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 91055314, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3374 ] , "outputIndexes": [ 3375 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3375 ] , "outputIndexes": [ 2167 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_740_output_0", "inputIndexes": [ 2106, 20 ] , "outputIndexes": [ 2168 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_741_output_0", "inputIndexes": [ 2114, 20 ] , "outputIndexes": [ 2169 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_301_output_0", "inputIndexes": [ 2168, 2169, 77, 31 ] , "outputIndexes": [ 2170 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_210_output_0", "inputIndexes": [ 2167, 2170 ] , "outputIndexes": [ 2171 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_215_output_0", "inputIndexes": [ 2139, 2166, 2171, 124 ] , "outputIndexes": [ 2172 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2172 ] , "outputIndexes": [ 3376 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3376 ] , "outputIndexes": [ 3377 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/self_attn/o_proj/Linear", "inputIndexes": [ 3377 ] , "outputIndexes": [ 3378 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 91179992, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3378 ] , "outputIndexes": [ 3379 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3379 ] , "outputIndexes": [ 2173 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_118_output_0", "inputIndexes": [ 2093, 2173 ] , "outputIndexes": [ 2174 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_23/Mul_1_output_0", "inputIndexes": [ 2174 ] , "outputIndexes": [ 2175 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 91553502, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2175 ] , "outputIndexes": [ 3380 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3380 ] , "outputIndexes": [ 3381 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/mlp/gate_proj/Linear", "inputIndexes": [ 3381 ] , "outputIndexes": [ 3382 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 91558110, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3382 ] , "outputIndexes": [ 3383 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3383 ] , "outputIndexes": [ 2176 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_23/Mul_output_0", "inputIndexes": [ 2176 ] , "outputIndexes": [ 2177 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/mlp/up_proj/Linear", "inputIndexes": [ 3381 ] , "outputIndexes": [ 3386 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 92553700, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3386 ] , "outputIndexes": [ 3387 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3387 ] , "outputIndexes": [ 2178 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_23/Mul_output_0", "inputIndexes": [ 2177, 2178 ] , "outputIndexes": [ 2179 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2179 ] , "outputIndexes": [ 3388 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3388 ] , "outputIndexes": [ 3389 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.23/mlp/down_proj/Linear", "inputIndexes": [ 3389 ] , "outputIndexes": [ 3390 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 93549290, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.23/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3390 ] , "outputIndexes": [ 3391 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3391 ] , "outputIndexes": [ 2180 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_119_output_0", "inputIndexes": [ 2174, 2180 ] , "outputIndexes": [ 2181 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_216_output_0", "inputIndexes": [ 2181, 3 ] , "outputIndexes": [ 2182 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_24/Mul_1_output_0", "inputIndexes": [ 2182 ] , "outputIndexes": [ 2183 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 94489584, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2183 ] , "outputIndexes": [ 3392 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3392 ] , "outputIndexes": [ 3393 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/self_attn/q_proj/Linear", "inputIndexes": [ 3393 ] , "outputIndexes": [ 3394 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 94494192, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3394 ] , "outputIndexes": [ 3395 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3395 ] , "outputIndexes": [ 2184 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_336_output_0", "inputIndexes": [ 2183 ] , "outputIndexes": [ 2185 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9012", "inputIndexes": [ 2185 ] , "outputIndexes": [ 2186 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9014", "inputIndexes": [ 2185 ] , "outputIndexes": [ 2187 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9016", "inputIndexes": [ 2187, 2187 ] , "outputIndexes": [ 2188 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9017", "inputIndexes": [ 2188 ] , "outputIndexes": [ 2189 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9019", "inputIndexes": [ 2188, 12 ] , "outputIndexes": [ 2190 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9020", "inputIndexes": [ 2190 ] , "outputIndexes": [ 2191 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9023", "inputIndexes": [ 2186, 2189, 2191, 15 ] , "outputIndexes": [ 2192 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9024", "inputIndexes": [ 2192 ] , "outputIndexes": [ 2193 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9026", "inputIndexes": [ 2193, 2193 ] , "outputIndexes": [ 2194 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_363_output_0", "inputIndexes": [ 2185, 2194, 2188 ] , "outputIndexes": [ 2195 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_768_output_0", "inputIndexes": [ 2195, 20 ] , "outputIndexes": [ 2196 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9034", "inputIndexes": [ 2188 ] , "outputIndexes": [ 2197 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9037", "inputIndexes": [ 2190 ] , "outputIndexes": [ 2198 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9040", "inputIndexes": [ 2186, 2197, 2198, 15 ] , "outputIndexes": [ 2199 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9041", "inputIndexes": [ 2199 ] , "outputIndexes": [ 2200 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9042", "inputIndexes": [ 12, 2200 ] , "outputIndexes": [ 2201 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9043", "inputIndexes": [ 2201, 2200 ] , "outputIndexes": [ 2202 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_364_output_0", "inputIndexes": [ 2185, 2202, 2188 ] , "outputIndexes": [ 2203 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_769_output_0", "inputIndexes": [ 2203, 20 ] , "outputIndexes": [ 2204 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_312_output_0", "inputIndexes": [ 2196, 2204, 30, 31 ] , "outputIndexes": [ 2205 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_217_output_0", "inputIndexes": [ 2184, 2205 ] , "outputIndexes": [ 2206 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_192_output_0", "inputIndexes": [ 2206, 58 ] , "outputIndexes": [ 2207 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_338_output_0", "inputIndexes": [ 2206 ] , "outputIndexes": [ 2208 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9144", "inputIndexes": [ 2208 ] , "outputIndexes": [ 2209 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9146", "inputIndexes": [ 2208 ] , "outputIndexes": [ 2210 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9148", "inputIndexes": [ 2210, 2210 ] , "outputIndexes": [ 2211 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9149", "inputIndexes": [ 2211 ] , "outputIndexes": [ 2212 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9151", "inputIndexes": [ 2211, 12 ] , "outputIndexes": [ 2213 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9152", "inputIndexes": [ 2213 ] , "outputIndexes": [ 2214 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9155", "inputIndexes": [ 2209, 2212, 2214, 15 ] , "outputIndexes": [ 2215 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9156", "inputIndexes": [ 2215 ] , "outputIndexes": [ 2216 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9157", "inputIndexes": [ 61, 2216 ] , "outputIndexes": [ 2217 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9158", "inputIndexes": [ 2217, 2216 ] , "outputIndexes": [ 2218 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_365_output_0", "inputIndexes": [ 2208, 2218, 2211 ] , "outputIndexes": [ 2219 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_72_output_0", "inputIndexes": [ 2219, 73 ] , "outputIndexes": [ 2220 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_775_output_0", "inputIndexes": [ 2220, 20 ] , "outputIndexes": [ 2221 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_97_output_0", "inputIndexes": [ 2206, 2221, 76, 77, 15 ] , "outputIndexes": [ 2222 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_48_output_0", "inputIndexes": [ 2222 ] , "outputIndexes": [ 2223 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_774_output_0", "inputIndexes": [ 2220, 20 ] , "outputIndexes": [ 2224 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_96_output_0", "inputIndexes": [ 2206, 20, 2224, 77, 15 ] , "outputIndexes": [ 2225 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_315_output_0", "inputIndexes": [ 2223, 2225 ] , "outputIndexes": [ 2226 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_193_output_0", "inputIndexes": [ 2226, 89 ] , "outputIndexes": [ 2227 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_120_output_0", "inputIndexes": [ 2207, 2227 ] , "outputIndexes": [ 2228 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/self_attn/k_proj/Linear", "inputIndexes": [ 3393 ] , "outputIndexes": [ 3398 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 94867702, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3398 ] , "outputIndexes": [ 3399 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3399 ] , "outputIndexes": [ 2229 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_770_output_0", "inputIndexes": [ 2195, 20 ] , "outputIndexes": [ 2230 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_771_output_0", "inputIndexes": [ 2203, 20 ] , "outputIndexes": [ 2231 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_313_output_0", "inputIndexes": [ 2230, 2231, 77, 31 ] , "outputIndexes": [ 2232 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_218_output_0", "inputIndexes": [ 2229, 2232 ] , "outputIndexes": [ 2233 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_194_output_0", "inputIndexes": [ 2233, 58 ] , "outputIndexes": [ 2234 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_339_output_0", "inputIndexes": [ 2233 ] , "outputIndexes": [ 2235 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9050", "inputIndexes": [ 2235 ] , "outputIndexes": [ 2236 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9052", "inputIndexes": [ 2235 ] , "outputIndexes": [ 2237 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9054", "inputIndexes": [ 2237, 2237 ] , "outputIndexes": [ 2238 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9055", "inputIndexes": [ 2238 ] , "outputIndexes": [ 2239 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9057", "inputIndexes": [ 2238, 12 ] , "outputIndexes": [ 2240 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9058", "inputIndexes": [ 2240 ] , "outputIndexes": [ 2241 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9061", "inputIndexes": [ 2236, 2239, 2241, 15 ] , "outputIndexes": [ 2242 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9062", "inputIndexes": [ 2242 ] , "outputIndexes": [ 2243 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9063", "inputIndexes": [ 61, 2243 ] , "outputIndexes": [ 2244 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9064", "inputIndexes": [ 2244, 2243 ] , "outputIndexes": [ 2245 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_366_output_0", "inputIndexes": [ 2235, 2245, 2238 ] , "outputIndexes": [ 2246 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_73_output_0", "inputIndexes": [ 2246, 73 ] , "outputIndexes": [ 2247 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_777_output_0", "inputIndexes": [ 2247, 20 ] , "outputIndexes": [ 2248 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_99_output_0", "inputIndexes": [ 2233, 2248, 76, 77, 15 ] , "outputIndexes": [ 2249 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_49_output_0", "inputIndexes": [ 2249 ] , "outputIndexes": [ 2250 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_776_output_0", "inputIndexes": [ 2247, 20 ] , "outputIndexes": [ 2251 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_98_output_0", "inputIndexes": [ 2233, 20, 2251, 77, 15 ] , "outputIndexes": [ 2252 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_316_output_0", "inputIndexes": [ 2250, 2252 ] , "outputIndexes": [ 2253 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_195_output_0", "inputIndexes": [ 2253, 89 ] , "outputIndexes": [ 2254 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_121_output_0", "inputIndexes": [ 2234, 2254 ] , "outputIndexes": [ 2255 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/self_attn/v_proj/Linear", "inputIndexes": [ 3393 ] , "outputIndexes": [ 3402 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 94992380, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3402 ] , "outputIndexes": [ 3403 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3403 ] , "outputIndexes": [ 2256 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_772_output_0", "inputIndexes": [ 2195, 20 ] , "outputIndexes": [ 2257 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_773_output_0", "inputIndexes": [ 2203, 20 ] , "outputIndexes": [ 2258 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_314_output_0", "inputIndexes": [ 2257, 2258, 77, 31 ] , "outputIndexes": [ 2259 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_219_output_0", "inputIndexes": [ 2256, 2259 ] , "outputIndexes": [ 2260 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_224_output_0", "inputIndexes": [ 2228, 2255, 2260, 124 ] , "outputIndexes": [ 2261 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2261 ] , "outputIndexes": [ 3404 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3404 ] , "outputIndexes": [ 3405 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/self_attn/o_proj/Linear", "inputIndexes": [ 3405 ] , "outputIndexes": [ 3406 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 95117058, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3406 ] , "outputIndexes": [ 3407 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3407 ] , "outputIndexes": [ 2262 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_123_output_0", "inputIndexes": [ 2182, 2262 ] , "outputIndexes": [ 2263 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_24/Mul_1_output_0", "inputIndexes": [ 2263 ] , "outputIndexes": [ 2264 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 95490568, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2264 ] , "outputIndexes": [ 3408 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3408 ] , "outputIndexes": [ 3409 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/mlp/gate_proj/Linear", "inputIndexes": [ 3409 ] , "outputIndexes": [ 3410 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 95495176, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3410 ] , "outputIndexes": [ 3411 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3411 ] , "outputIndexes": [ 2265 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_24/Mul_output_0", "inputIndexes": [ 2265 ] , "outputIndexes": [ 2266 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/mlp/up_proj/Linear", "inputIndexes": [ 3409 ] , "outputIndexes": [ 3414 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 96490766, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3414 ] , "outputIndexes": [ 3415 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3415 ] , "outputIndexes": [ 2267 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_24/Mul_output_0", "inputIndexes": [ 2266, 2267 ] , "outputIndexes": [ 2268 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2268 ] , "outputIndexes": [ 3416 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3416 ] , "outputIndexes": [ 3417 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.24/mlp/down_proj/Linear", "inputIndexes": [ 3417 ] , "outputIndexes": [ 3418 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 97486356, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.24/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3418 ] , "outputIndexes": [ 3419 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.24/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3419 ] , "outputIndexes": [ 2269 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_124_output_0", "inputIndexes": [ 2263, 2269 ] , "outputIndexes": [ 2270 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_225_output_0", "inputIndexes": [ 2270, 3 ] , "outputIndexes": [ 2271 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_25/Mul_1_output_0", "inputIndexes": [ 2271 ] , "outputIndexes": [ 2272 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 98426650, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2272 ] , "outputIndexes": [ 3420 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3420 ] , "outputIndexes": [ 3421 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/self_attn/q_proj/Linear", "inputIndexes": [ 3421 ] , "outputIndexes": [ 3422 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 98431258, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3422 ] , "outputIndexes": [ 3423 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3423 ] , "outputIndexes": [ 2273 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_350_output_0", "inputIndexes": [ 2272 ] , "outputIndexes": [ 2274 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9383", "inputIndexes": [ 2274 ] , "outputIndexes": [ 2275 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9385", "inputIndexes": [ 2274 ] , "outputIndexes": [ 2276 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9387", "inputIndexes": [ 2276, 2276 ] , "outputIndexes": [ 2277 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9388", "inputIndexes": [ 2277 ] , "outputIndexes": [ 2278 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9390", "inputIndexes": [ 2277, 12 ] , "outputIndexes": [ 2279 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9391", "inputIndexes": [ 2279 ] , "outputIndexes": [ 2280 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9394", "inputIndexes": [ 2275, 2278, 2280, 15 ] , "outputIndexes": [ 2281 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9395", "inputIndexes": [ 2281 ] , "outputIndexes": [ 2282 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9397", "inputIndexes": [ 2282, 2282 ] , "outputIndexes": [ 2283 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_378_output_0", "inputIndexes": [ 2274, 2283, 2277 ] , "outputIndexes": [ 2284 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_800_output_0", "inputIndexes": [ 2284, 20 ] , "outputIndexes": [ 2285 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9405", "inputIndexes": [ 2277 ] , "outputIndexes": [ 2286 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9408", "inputIndexes": [ 2279 ] , "outputIndexes": [ 2287 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9411", "inputIndexes": [ 2275, 2286, 2287, 15 ] , "outputIndexes": [ 2288 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9412", "inputIndexes": [ 2288 ] , "outputIndexes": [ 2289 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9413", "inputIndexes": [ 12, 2289 ] , "outputIndexes": [ 2290 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9414", "inputIndexes": [ 2290, 2289 ] , "outputIndexes": [ 2291 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_379_output_0", "inputIndexes": [ 2274, 2291, 2277 ] , "outputIndexes": [ 2292 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_801_output_0", "inputIndexes": [ 2292, 20 ] , "outputIndexes": [ 2293 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_325_output_0", "inputIndexes": [ 2285, 2293, 30, 31 ] , "outputIndexes": [ 2294 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_226_output_0", "inputIndexes": [ 2273, 2294 ] , "outputIndexes": [ 2295 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_200_output_0", "inputIndexes": [ 2295, 58 ] , "outputIndexes": [ 2296 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_352_output_0", "inputIndexes": [ 2295 ] , "outputIndexes": [ 2297 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9515", "inputIndexes": [ 2297 ] , "outputIndexes": [ 2298 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9517", "inputIndexes": [ 2297 ] , "outputIndexes": [ 2299 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9519", "inputIndexes": [ 2299, 2299 ] , "outputIndexes": [ 2300 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9520", "inputIndexes": [ 2300 ] , "outputIndexes": [ 2301 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9522", "inputIndexes": [ 2300, 12 ] , "outputIndexes": [ 2302 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9523", "inputIndexes": [ 2302 ] , "outputIndexes": [ 2303 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9526", "inputIndexes": [ 2298, 2301, 2303, 15 ] , "outputIndexes": [ 2304 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9527", "inputIndexes": [ 2304 ] , "outputIndexes": [ 2305 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9528", "inputIndexes": [ 61, 2305 ] , "outputIndexes": [ 2306 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9529", "inputIndexes": [ 2306, 2305 ] , "outputIndexes": [ 2307 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_380_output_0", "inputIndexes": [ 2297, 2307, 2300 ] , "outputIndexes": [ 2308 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_75_output_0", "inputIndexes": [ 2308, 73 ] , "outputIndexes": [ 2309 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_807_output_0", "inputIndexes": [ 2309, 20 ] , "outputIndexes": [ 2310 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_101_output_0", "inputIndexes": [ 2295, 2310, 76, 77, 15 ] , "outputIndexes": [ 2311 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_50_output_0", "inputIndexes": [ 2311 ] , "outputIndexes": [ 2312 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_806_output_0", "inputIndexes": [ 2309, 20 ] , "outputIndexes": [ 2313 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_100_output_0", "inputIndexes": [ 2295, 20, 2313, 77, 15 ] , "outputIndexes": [ 2314 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_328_output_0", "inputIndexes": [ 2312, 2314 ] , "outputIndexes": [ 2315 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_201_output_0", "inputIndexes": [ 2315, 89 ] , "outputIndexes": [ 2316 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_125_output_0", "inputIndexes": [ 2296, 2316 ] , "outputIndexes": [ 2317 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/self_attn/k_proj/Linear", "inputIndexes": [ 3421 ] , "outputIndexes": [ 3426 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 98804768, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3426 ] , "outputIndexes": [ 3427 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3427 ] , "outputIndexes": [ 2318 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_802_output_0", "inputIndexes": [ 2284, 20 ] , "outputIndexes": [ 2319 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_803_output_0", "inputIndexes": [ 2292, 20 ] , "outputIndexes": [ 2320 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_326_output_0", "inputIndexes": [ 2319, 2320, 77, 31 ] , "outputIndexes": [ 2321 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_227_output_0", "inputIndexes": [ 2318, 2321 ] , "outputIndexes": [ 2322 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_202_output_0", "inputIndexes": [ 2322, 58 ] , "outputIndexes": [ 2323 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_353_output_0", "inputIndexes": [ 2322 ] , "outputIndexes": [ 2324 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9421", "inputIndexes": [ 2324 ] , "outputIndexes": [ 2325 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9423", "inputIndexes": [ 2324 ] , "outputIndexes": [ 2326 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9425", "inputIndexes": [ 2326, 2326 ] , "outputIndexes": [ 2327 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9426", "inputIndexes": [ 2327 ] , "outputIndexes": [ 2328 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9428", "inputIndexes": [ 2327, 12 ] , "outputIndexes": [ 2329 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9429", "inputIndexes": [ 2329 ] , "outputIndexes": [ 2330 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9432", "inputIndexes": [ 2325, 2328, 2330, 15 ] , "outputIndexes": [ 2331 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9433", "inputIndexes": [ 2331 ] , "outputIndexes": [ 2332 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9434", "inputIndexes": [ 61, 2332 ] , "outputIndexes": [ 2333 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9435", "inputIndexes": [ 2333, 2332 ] , "outputIndexes": [ 2334 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_381_output_0", "inputIndexes": [ 2324, 2334, 2327 ] , "outputIndexes": [ 2335 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_76_output_0", "inputIndexes": [ 2335, 73 ] , "outputIndexes": [ 2336 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_809_output_0", "inputIndexes": [ 2336, 20 ] , "outputIndexes": [ 2337 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_103_output_0", "inputIndexes": [ 2322, 2337, 76, 77, 15 ] , "outputIndexes": [ 2338 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_51_output_0", "inputIndexes": [ 2338 ] , "outputIndexes": [ 2339 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_808_output_0", "inputIndexes": [ 2336, 20 ] , "outputIndexes": [ 2340 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_102_output_0", "inputIndexes": [ 2322, 20, 2340, 77, 15 ] , "outputIndexes": [ 2341 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_329_output_0", "inputIndexes": [ 2339, 2341 ] , "outputIndexes": [ 2342 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_203_output_0", "inputIndexes": [ 2342, 89 ] , "outputIndexes": [ 2343 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_126_output_0", "inputIndexes": [ 2323, 2343 ] , "outputIndexes": [ 2344 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/self_attn/v_proj/Linear", "inputIndexes": [ 3421 ] , "outputIndexes": [ 3430 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 98929446, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3430 ] , "outputIndexes": [ 3431 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3431 ] , "outputIndexes": [ 2345 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_804_output_0", "inputIndexes": [ 2284, 20 ] , "outputIndexes": [ 2346 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_805_output_0", "inputIndexes": [ 2292, 20 ] , "outputIndexes": [ 2347 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_327_output_0", "inputIndexes": [ 2346, 2347, 77, 31 ] , "outputIndexes": [ 2348 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_228_output_0", "inputIndexes": [ 2345, 2348 ] , "outputIndexes": [ 2349 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_233_output_0", "inputIndexes": [ 2317, 2344, 2349, 124 ] , "outputIndexes": [ 2350 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2350 ] , "outputIndexes": [ 3432 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3432 ] , "outputIndexes": [ 3433 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/self_attn/o_proj/Linear", "inputIndexes": [ 3433 ] , "outputIndexes": [ 3434 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 99054124, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3434 ] , "outputIndexes": [ 3435 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3435 ] , "outputIndexes": [ 2351 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_128_output_0", "inputIndexes": [ 2271, 2351 ] , "outputIndexes": [ 2352 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_25/Mul_1_output_0", "inputIndexes": [ 2352 ] , "outputIndexes": [ 2353 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 99427634, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2353 ] , "outputIndexes": [ 3436 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3436 ] , "outputIndexes": [ 3437 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/mlp/gate_proj/Linear", "inputIndexes": [ 3437 ] , "outputIndexes": [ 3438 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 99432242, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3438 ] , "outputIndexes": [ 3439 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3439 ] , "outputIndexes": [ 2354 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_25/Mul_output_0", "inputIndexes": [ 2354 ] , "outputIndexes": [ 2355 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/mlp/up_proj/Linear", "inputIndexes": [ 3437 ] , "outputIndexes": [ 3442 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 100427832, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3442 ] , "outputIndexes": [ 3443 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3443 ] , "outputIndexes": [ 2356 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_25/Mul_output_0", "inputIndexes": [ 2355, 2356 ] , "outputIndexes": [ 2357 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2357 ] , "outputIndexes": [ 3444 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3444 ] , "outputIndexes": [ 3445 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.25/mlp/down_proj/Linear", "inputIndexes": [ 3445 ] , "outputIndexes": [ 3446 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 101423422, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.25/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3446 ] , "outputIndexes": [ 3447 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.25/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3447 ] , "outputIndexes": [ 2358 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_129_output_0", "inputIndexes": [ 2352, 2358 ] , "outputIndexes": [ 2359 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_234_output_0", "inputIndexes": [ 2359, 3 ] , "outputIndexes": [ 2360 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_26/Mul_1_output_0", "inputIndexes": [ 2360 ] , "outputIndexes": [ 2361 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 102363716, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2361 ] , "outputIndexes": [ 3448 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3448 ] , "outputIndexes": [ 3449 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/self_attn/q_proj/Linear", "inputIndexes": [ 3449 ] , "outputIndexes": [ 3450 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 102368324, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3450 ] , "outputIndexes": [ 3451 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3451 ] , "outputIndexes": [ 2362 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_364_output_0", "inputIndexes": [ 2361 ] , "outputIndexes": [ 2363 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9754", "inputIndexes": [ 2363 ] , "outputIndexes": [ 2364 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9756", "inputIndexes": [ 2363 ] , "outputIndexes": [ 2365 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9758", "inputIndexes": [ 2365, 2365 ] , "outputIndexes": [ 2366 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9759", "inputIndexes": [ 2366 ] , "outputIndexes": [ 2367 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9761", "inputIndexes": [ 2366, 12 ] , "outputIndexes": [ 2368 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9762", "inputIndexes": [ 2368 ] , "outputIndexes": [ 2369 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9765", "inputIndexes": [ 2364, 2367, 2369, 15 ] , "outputIndexes": [ 2370 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9766", "inputIndexes": [ 2370 ] , "outputIndexes": [ 2371 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9768", "inputIndexes": [ 2371, 2371 ] , "outputIndexes": [ 2372 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_393_output_0", "inputIndexes": [ 2363, 2372, 2366 ] , "outputIndexes": [ 2373 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_832_output_0", "inputIndexes": [ 2373, 20 ] , "outputIndexes": [ 2374 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9776", "inputIndexes": [ 2366 ] , "outputIndexes": [ 2375 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9779", "inputIndexes": [ 2368 ] , "outputIndexes": [ 2376 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9782", "inputIndexes": [ 2364, 2375, 2376, 15 ] , "outputIndexes": [ 2377 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9783", "inputIndexes": [ 2377 ] , "outputIndexes": [ 2378 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9784", "inputIndexes": [ 12, 2378 ] , "outputIndexes": [ 2379 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9785", "inputIndexes": [ 2379, 2378 ] , "outputIndexes": [ 2380 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_394_output_0", "inputIndexes": [ 2363, 2380, 2366 ] , "outputIndexes": [ 2381 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_833_output_0", "inputIndexes": [ 2381, 20 ] , "outputIndexes": [ 2382 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_338_output_0", "inputIndexes": [ 2374, 2382, 30, 31 ] , "outputIndexes": [ 2383 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_235_output_0", "inputIndexes": [ 2362, 2383 ] , "outputIndexes": [ 2384 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_208_output_0", "inputIndexes": [ 2384, 58 ] , "outputIndexes": [ 2385 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_366_output_0", "inputIndexes": [ 2384 ] , "outputIndexes": [ 2386 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9886", "inputIndexes": [ 2386 ] , "outputIndexes": [ 2387 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9888", "inputIndexes": [ 2386 ] , "outputIndexes": [ 2388 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9890", "inputIndexes": [ 2388, 2388 ] , "outputIndexes": [ 2389 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9891", "inputIndexes": [ 2389 ] , "outputIndexes": [ 2390 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9893", "inputIndexes": [ 2389, 12 ] , "outputIndexes": [ 2391 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9894", "inputIndexes": [ 2391 ] , "outputIndexes": [ 2392 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9897", "inputIndexes": [ 2387, 2390, 2392, 15 ] , "outputIndexes": [ 2393 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9898", "inputIndexes": [ 2393 ] , "outputIndexes": [ 2394 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9899", "inputIndexes": [ 61, 2394 ] , "outputIndexes": [ 2395 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9900", "inputIndexes": [ 2395, 2394 ] , "outputIndexes": [ 2396 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_395_output_0", "inputIndexes": [ 2386, 2396, 2389 ] , "outputIndexes": [ 2397 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_78_output_0", "inputIndexes": [ 2397, 73 ] , "outputIndexes": [ 2398 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_839_output_0", "inputIndexes": [ 2398, 20 ] , "outputIndexes": [ 2399 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_105_output_0", "inputIndexes": [ 2384, 2399, 76, 77, 15 ] , "outputIndexes": [ 2400 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_52_output_0", "inputIndexes": [ 2400 ] , "outputIndexes": [ 2401 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_838_output_0", "inputIndexes": [ 2398, 20 ] , "outputIndexes": [ 2402 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_104_output_0", "inputIndexes": [ 2384, 20, 2402, 77, 15 ] , "outputIndexes": [ 2403 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_341_output_0", "inputIndexes": [ 2401, 2403 ] , "outputIndexes": [ 2404 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_209_output_0", "inputIndexes": [ 2404, 89 ] , "outputIndexes": [ 2405 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_130_output_0", "inputIndexes": [ 2385, 2405 ] , "outputIndexes": [ 2406 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/self_attn/k_proj/Linear", "inputIndexes": [ 3449 ] , "outputIndexes": [ 3454 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 102741834, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3454 ] , "outputIndexes": [ 3455 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3455 ] , "outputIndexes": [ 2407 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_834_output_0", "inputIndexes": [ 2373, 20 ] , "outputIndexes": [ 2408 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_835_output_0", "inputIndexes": [ 2381, 20 ] , "outputIndexes": [ 2409 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_339_output_0", "inputIndexes": [ 2408, 2409, 77, 31 ] , "outputIndexes": [ 2410 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_236_output_0", "inputIndexes": [ 2407, 2410 ] , "outputIndexes": [ 2411 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_210_output_0", "inputIndexes": [ 2411, 58 ] , "outputIndexes": [ 2412 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_367_output_0", "inputIndexes": [ 2411 ] , "outputIndexes": [ 2413 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape9792", "inputIndexes": [ 2413 ] , "outputIndexes": [ 2414 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank9794", "inputIndexes": [ 2413 ] , "outputIndexes": [ 2415 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9796", "inputIndexes": [ 2415, 2415 ] , "outputIndexes": [ 2416 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9797", "inputIndexes": [ 2416 ] , "outputIndexes": [ 2417 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9799", "inputIndexes": [ 2416, 12 ] , "outputIndexes": [ 2418 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze9800", "inputIndexes": [ 2418 ] , "outputIndexes": [ 2419 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice9803", "inputIndexes": [ 2414, 2417, 2419, 15 ] , "outputIndexes": [ 2420 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze9804", "inputIndexes": [ 2420 ] , "outputIndexes": [ 2421 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9805", "inputIndexes": [ 61, 2421 ] , "outputIndexes": [ 2422 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp9806", "inputIndexes": [ 2422, 2421 ] , "outputIndexes": [ 2423 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_396_output_0", "inputIndexes": [ 2413, 2423, 2416 ] , "outputIndexes": [ 2424 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_79_output_0", "inputIndexes": [ 2424, 73 ] , "outputIndexes": [ 2425 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_841_output_0", "inputIndexes": [ 2425, 20 ] , "outputIndexes": [ 2426 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_107_output_0", "inputIndexes": [ 2411, 2426, 76, 77, 15 ] , "outputIndexes": [ 2427 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_53_output_0", "inputIndexes": [ 2427 ] , "outputIndexes": [ 2428 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_840_output_0", "inputIndexes": [ 2425, 20 ] , "outputIndexes": [ 2429 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_106_output_0", "inputIndexes": [ 2411, 20, 2429, 77, 15 ] , "outputIndexes": [ 2430 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_342_output_0", "inputIndexes": [ 2428, 2430 ] , "outputIndexes": [ 2431 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_211_output_0", "inputIndexes": [ 2431, 89 ] , "outputIndexes": [ 2432 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_131_output_0", "inputIndexes": [ 2412, 2432 ] , "outputIndexes": [ 2433 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/self_attn/v_proj/Linear", "inputIndexes": [ 3449 ] , "outputIndexes": [ 3458 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 102866512, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3458 ] , "outputIndexes": [ 3459 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3459 ] , "outputIndexes": [ 2434 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_836_output_0", "inputIndexes": [ 2373, 20 ] , "outputIndexes": [ 2435 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_837_output_0", "inputIndexes": [ 2381, 20 ] , "outputIndexes": [ 2436 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_340_output_0", "inputIndexes": [ 2435, 2436, 77, 31 ] , "outputIndexes": [ 2437 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_237_output_0", "inputIndexes": [ 2434, 2437 ] , "outputIndexes": [ 2438 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_242_output_0", "inputIndexes": [ 2406, 2433, 2438, 124 ] , "outputIndexes": [ 2439 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2439 ] , "outputIndexes": [ 3460 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3460 ] , "outputIndexes": [ 3461 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/self_attn/o_proj/Linear", "inputIndexes": [ 3461 ] , "outputIndexes": [ 3462 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 102991190, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3462 ] , "outputIndexes": [ 3463 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3463 ] , "outputIndexes": [ 2440 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_133_output_0", "inputIndexes": [ 2360, 2440 ] , "outputIndexes": [ 2441 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_26/Mul_1_output_0", "inputIndexes": [ 2441 ] , "outputIndexes": [ 2442 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 103364700, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2442 ] , "outputIndexes": [ 3464 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3464 ] , "outputIndexes": [ 3465 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/mlp/gate_proj/Linear", "inputIndexes": [ 3465 ] , "outputIndexes": [ 3466 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 103369308, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3466 ] , "outputIndexes": [ 3467 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3467 ] , "outputIndexes": [ 2443 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_26/Mul_output_0", "inputIndexes": [ 2443 ] , "outputIndexes": [ 2444 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/mlp/up_proj/Linear", "inputIndexes": [ 3465 ] , "outputIndexes": [ 3470 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 104364898, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3470 ] , "outputIndexes": [ 3471 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3471 ] , "outputIndexes": [ 2445 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_26/Mul_output_0", "inputIndexes": [ 2444, 2445 ] , "outputIndexes": [ 2446 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2446 ] , "outputIndexes": [ 3472 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3472 ] , "outputIndexes": [ 3473 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.26/mlp/down_proj/Linear", "inputIndexes": [ 3473 ] , "outputIndexes": [ 3474 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 105360488, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.26/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3474 ] , "outputIndexes": [ 3475 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.26/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3475 ] , "outputIndexes": [ 2447 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_134_output_0", "inputIndexes": [ 2441, 2447 ] , "outputIndexes": [ 2448 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_243_output_0", "inputIndexes": [ 2448, 3 ] , "outputIndexes": [ 2449 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_27/Mul_1_output_0", "inputIndexes": [ 2449 ] , "outputIndexes": [ 2450 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 106300782, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2450 ] , "outputIndexes": [ 3476 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3476 ] , "outputIndexes": [ 3477 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/self_attn/q_proj/Linear", "inputIndexes": [ 3477 ] , "outputIndexes": [ 3478 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 106305390, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3478 ] , "outputIndexes": [ 3479 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3479 ] , "outputIndexes": [ 2451 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_378_output_0", "inputIndexes": [ 2450 ] , "outputIndexes": [ 2452 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10125", "inputIndexes": [ 2452 ] , "outputIndexes": [ 2453 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10127", "inputIndexes": [ 2452 ] , "outputIndexes": [ 2454 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10129", "inputIndexes": [ 2454, 2454 ] , "outputIndexes": [ 2455 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10130", "inputIndexes": [ 2455 ] , "outputIndexes": [ 2456 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10132", "inputIndexes": [ 2455, 12 ] , "outputIndexes": [ 2457 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10133", "inputIndexes": [ 2457 ] , "outputIndexes": [ 2458 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10136", "inputIndexes": [ 2453, 2456, 2458, 15 ] , "outputIndexes": [ 2459 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10137", "inputIndexes": [ 2459 ] , "outputIndexes": [ 2460 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10139", "inputIndexes": [ 2460, 2460 ] , "outputIndexes": [ 2461 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_408_output_0", "inputIndexes": [ 2452, 2461, 2455 ] , "outputIndexes": [ 2462 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_864_output_0", "inputIndexes": [ 2462, 20 ] , "outputIndexes": [ 2463 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10147", "inputIndexes": [ 2455 ] , "outputIndexes": [ 2464 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10150", "inputIndexes": [ 2457 ] , "outputIndexes": [ 2465 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10153", "inputIndexes": [ 2453, 2464, 2465, 15 ] , "outputIndexes": [ 2466 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10154", "inputIndexes": [ 2466 ] , "outputIndexes": [ 2467 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10155", "inputIndexes": [ 12, 2467 ] , "outputIndexes": [ 2468 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10156", "inputIndexes": [ 2468, 2467 ] , "outputIndexes": [ 2469 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_409_output_0", "inputIndexes": [ 2452, 2469, 2455 ] , "outputIndexes": [ 2470 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_865_output_0", "inputIndexes": [ 2470, 20 ] , "outputIndexes": [ 2471 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_351_output_0", "inputIndexes": [ 2463, 2471, 30, 31 ] , "outputIndexes": [ 2472 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_244_output_0", "inputIndexes": [ 2451, 2472 ] , "outputIndexes": [ 2473 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_216_output_0", "inputIndexes": [ 2473, 58 ] , "outputIndexes": [ 2474 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_380_output_0", "inputIndexes": [ 2473 ] , "outputIndexes": [ 2475 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10257", "inputIndexes": [ 2475 ] , "outputIndexes": [ 2476 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10259", "inputIndexes": [ 2475 ] , "outputIndexes": [ 2477 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10261", "inputIndexes": [ 2477, 2477 ] , "outputIndexes": [ 2478 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10262", "inputIndexes": [ 2478 ] , "outputIndexes": [ 2479 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10264", "inputIndexes": [ 2478, 12 ] , "outputIndexes": [ 2480 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10265", "inputIndexes": [ 2480 ] , "outputIndexes": [ 2481 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10268", "inputIndexes": [ 2476, 2479, 2481, 15 ] , "outputIndexes": [ 2482 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10269", "inputIndexes": [ 2482 ] , "outputIndexes": [ 2483 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10270", "inputIndexes": [ 61, 2483 ] , "outputIndexes": [ 2484 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10271", "inputIndexes": [ 2484, 2483 ] , "outputIndexes": [ 2485 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_410_output_0", "inputIndexes": [ 2475, 2485, 2478 ] , "outputIndexes": [ 2486 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_81_output_0", "inputIndexes": [ 2486, 73 ] , "outputIndexes": [ 2487 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_871_output_0", "inputIndexes": [ 2487, 20 ] , "outputIndexes": [ 2488 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_109_output_0", "inputIndexes": [ 2473, 2488, 76, 77, 15 ] , "outputIndexes": [ 2489 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_54_output_0", "inputIndexes": [ 2489 ] , "outputIndexes": [ 2490 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_870_output_0", "inputIndexes": [ 2487, 20 ] , "outputIndexes": [ 2491 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_108_output_0", "inputIndexes": [ 2473, 20, 2491, 77, 15 ] , "outputIndexes": [ 2492 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_354_output_0", "inputIndexes": [ 2490, 2492 ] , "outputIndexes": [ 2493 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_217_output_0", "inputIndexes": [ 2493, 89 ] , "outputIndexes": [ 2494 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_135_output_0", "inputIndexes": [ 2474, 2494 ] , "outputIndexes": [ 2495 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/self_attn/k_proj/Linear", "inputIndexes": [ 3477 ] , "outputIndexes": [ 3482 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 106678900, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3482 ] , "outputIndexes": [ 3483 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3483 ] , "outputIndexes": [ 2496 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_866_output_0", "inputIndexes": [ 2462, 20 ] , "outputIndexes": [ 2497 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_867_output_0", "inputIndexes": [ 2470, 20 ] , "outputIndexes": [ 2498 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_352_output_0", "inputIndexes": [ 2497, 2498, 77, 31 ] , "outputIndexes": [ 2499 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_245_output_0", "inputIndexes": [ 2496, 2499 ] , "outputIndexes": [ 2500 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_218_output_0", "inputIndexes": [ 2500, 58 ] , "outputIndexes": [ 2501 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_381_output_0", "inputIndexes": [ 2500 ] , "outputIndexes": [ 2502 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10163", "inputIndexes": [ 2502 ] , "outputIndexes": [ 2503 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10165", "inputIndexes": [ 2502 ] , "outputIndexes": [ 2504 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10167", "inputIndexes": [ 2504, 2504 ] , "outputIndexes": [ 2505 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10168", "inputIndexes": [ 2505 ] , "outputIndexes": [ 2506 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10170", "inputIndexes": [ 2505, 12 ] , "outputIndexes": [ 2507 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10171", "inputIndexes": [ 2507 ] , "outputIndexes": [ 2508 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10174", "inputIndexes": [ 2503, 2506, 2508, 15 ] , "outputIndexes": [ 2509 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10175", "inputIndexes": [ 2509 ] , "outputIndexes": [ 2510 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10176", "inputIndexes": [ 61, 2510 ] , "outputIndexes": [ 2511 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10177", "inputIndexes": [ 2511, 2510 ] , "outputIndexes": [ 2512 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_411_output_0", "inputIndexes": [ 2502, 2512, 2505 ] , "outputIndexes": [ 2513 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_82_output_0", "inputIndexes": [ 2513, 73 ] , "outputIndexes": [ 2514 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_873_output_0", "inputIndexes": [ 2514, 20 ] , "outputIndexes": [ 2515 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_111_output_0", "inputIndexes": [ 2500, 2515, 76, 77, 15 ] , "outputIndexes": [ 2516 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_55_output_0", "inputIndexes": [ 2516 ] , "outputIndexes": [ 2517 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_872_output_0", "inputIndexes": [ 2514, 20 ] , "outputIndexes": [ 2518 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_110_output_0", "inputIndexes": [ 2500, 20, 2518, 77, 15 ] , "outputIndexes": [ 2519 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_355_output_0", "inputIndexes": [ 2517, 2519 ] , "outputIndexes": [ 2520 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_219_output_0", "inputIndexes": [ 2520, 89 ] , "outputIndexes": [ 2521 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_136_output_0", "inputIndexes": [ 2501, 2521 ] , "outputIndexes": [ 2522 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/self_attn/v_proj/Linear", "inputIndexes": [ 3477 ] , "outputIndexes": [ 3486 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 106803578, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3486 ] , "outputIndexes": [ 3487 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3487 ] , "outputIndexes": [ 2523 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_868_output_0", "inputIndexes": [ 2462, 20 ] , "outputIndexes": [ 2524 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_869_output_0", "inputIndexes": [ 2470, 20 ] , "outputIndexes": [ 2525 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_353_output_0", "inputIndexes": [ 2524, 2525, 77, 31 ] , "outputIndexes": [ 2526 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_246_output_0", "inputIndexes": [ 2523, 2526 ] , "outputIndexes": [ 2527 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_251_output_0", "inputIndexes": [ 2495, 2522, 2527, 124 ] , "outputIndexes": [ 2528 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2528 ] , "outputIndexes": [ 3488 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3488 ] , "outputIndexes": [ 3489 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/self_attn/o_proj/Linear", "inputIndexes": [ 3489 ] , "outputIndexes": [ 3490 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 106928256, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3490 ] , "outputIndexes": [ 3491 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3491 ] , "outputIndexes": [ 2529 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_138_output_0", "inputIndexes": [ 2449, 2529 ] , "outputIndexes": [ 2530 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_27/Mul_1_output_0", "inputIndexes": [ 2530 ] , "outputIndexes": [ 2531 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 107301766, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2531 ] , "outputIndexes": [ 3492 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3492 ] , "outputIndexes": [ 3493 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/mlp/gate_proj/Linear", "inputIndexes": [ 3493 ] , "outputIndexes": [ 3494 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 107306374, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3494 ] , "outputIndexes": [ 3495 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3495 ] , "outputIndexes": [ 2532 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_27/Mul_output_0", "inputIndexes": [ 2532 ] , "outputIndexes": [ 2533 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/mlp/up_proj/Linear", "inputIndexes": [ 3493 ] , "outputIndexes": [ 3498 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 108301964, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3498 ] , "outputIndexes": [ 3499 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3499 ] , "outputIndexes": [ 2534 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_27/Mul_output_0", "inputIndexes": [ 2533, 2534 ] , "outputIndexes": [ 2535 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2535 ] , "outputIndexes": [ 3500 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3500 ] , "outputIndexes": [ 3501 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.27/mlp/down_proj/Linear", "inputIndexes": [ 3501 ] , "outputIndexes": [ 3502 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 109297554, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.27/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3502 ] , "outputIndexes": [ 3503 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.27/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3503 ] , "outputIndexes": [ 2536 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_139_output_0", "inputIndexes": [ 2530, 2536 ] , "outputIndexes": [ 2537 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_252_output_0", "inputIndexes": [ 2537, 3 ] , "outputIndexes": [ 2538 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_28/Mul_1_output_0", "inputIndexes": [ 2538 ] , "outputIndexes": [ 2539 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 110237848, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2539 ] , "outputIndexes": [ 3504 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3504 ] , "outputIndexes": [ 3505 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/self_attn/q_proj/Linear", "inputIndexes": [ 3505 ] , "outputIndexes": [ 3506 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 110242456, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3506 ] , "outputIndexes": [ 3507 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3507 ] , "outputIndexes": [ 2540 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_392_output_0", "inputIndexes": [ 2539 ] , "outputIndexes": [ 2541 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10496", "inputIndexes": [ 2541 ] , "outputIndexes": [ 2542 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10498", "inputIndexes": [ 2541 ] , "outputIndexes": [ 2543 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10500", "inputIndexes": [ 2543, 2543 ] , "outputIndexes": [ 2544 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10501", "inputIndexes": [ 2544 ] , "outputIndexes": [ 2545 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10503", "inputIndexes": [ 2544, 12 ] , "outputIndexes": [ 2546 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10504", "inputIndexes": [ 2546 ] , "outputIndexes": [ 2547 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10507", "inputIndexes": [ 2542, 2545, 2547, 15 ] , "outputIndexes": [ 2548 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10508", "inputIndexes": [ 2548 ] , "outputIndexes": [ 2549 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10510", "inputIndexes": [ 2549, 2549 ] , "outputIndexes": [ 2550 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_423_output_0", "inputIndexes": [ 2541, 2550, 2544 ] , "outputIndexes": [ 2551 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_896_output_0", "inputIndexes": [ 2551, 20 ] , "outputIndexes": [ 2552 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10518", "inputIndexes": [ 2544 ] , "outputIndexes": [ 2553 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10521", "inputIndexes": [ 2546 ] , "outputIndexes": [ 2554 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10524", "inputIndexes": [ 2542, 2553, 2554, 15 ] , "outputIndexes": [ 2555 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10525", "inputIndexes": [ 2555 ] , "outputIndexes": [ 2556 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10526", "inputIndexes": [ 12, 2556 ] , "outputIndexes": [ 2557 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10527", "inputIndexes": [ 2557, 2556 ] , "outputIndexes": [ 2558 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_424_output_0", "inputIndexes": [ 2541, 2558, 2544 ] , "outputIndexes": [ 2559 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_897_output_0", "inputIndexes": [ 2559, 20 ] , "outputIndexes": [ 2560 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_364_output_0", "inputIndexes": [ 2552, 2560, 30, 31 ] , "outputIndexes": [ 2561 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_253_output_0", "inputIndexes": [ 2540, 2561 ] , "outputIndexes": [ 2562 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_224_output_0", "inputIndexes": [ 2562, 58 ] , "outputIndexes": [ 2563 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_394_output_0", "inputIndexes": [ 2562 ] , "outputIndexes": [ 2564 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10628", "inputIndexes": [ 2564 ] , "outputIndexes": [ 2565 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10630", "inputIndexes": [ 2564 ] , "outputIndexes": [ 2566 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10632", "inputIndexes": [ 2566, 2566 ] , "outputIndexes": [ 2567 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10633", "inputIndexes": [ 2567 ] , "outputIndexes": [ 2568 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10635", "inputIndexes": [ 2567, 12 ] , "outputIndexes": [ 2569 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10636", "inputIndexes": [ 2569 ] , "outputIndexes": [ 2570 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10639", "inputIndexes": [ 2565, 2568, 2570, 15 ] , "outputIndexes": [ 2571 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10640", "inputIndexes": [ 2571 ] , "outputIndexes": [ 2572 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10641", "inputIndexes": [ 61, 2572 ] , "outputIndexes": [ 2573 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10642", "inputIndexes": [ 2573, 2572 ] , "outputIndexes": [ 2574 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_425_output_0", "inputIndexes": [ 2564, 2574, 2567 ] , "outputIndexes": [ 2575 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_84_output_0", "inputIndexes": [ 2575, 73 ] , "outputIndexes": [ 2576 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_903_output_0", "inputIndexes": [ 2576, 20 ] , "outputIndexes": [ 2577 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_113_output_0", "inputIndexes": [ 2562, 2577, 76, 77, 15 ] , "outputIndexes": [ 2578 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_56_output_0", "inputIndexes": [ 2578 ] , "outputIndexes": [ 2579 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_902_output_0", "inputIndexes": [ 2576, 20 ] , "outputIndexes": [ 2580 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_112_output_0", "inputIndexes": [ 2562, 20, 2580, 77, 15 ] , "outputIndexes": [ 2581 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_367_output_0", "inputIndexes": [ 2579, 2581 ] , "outputIndexes": [ 2582 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_225_output_0", "inputIndexes": [ 2582, 89 ] , "outputIndexes": [ 2583 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_140_output_0", "inputIndexes": [ 2563, 2583 ] , "outputIndexes": [ 2584 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/self_attn/k_proj/Linear", "inputIndexes": [ 3505 ] , "outputIndexes": [ 3510 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 110615966, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3510 ] , "outputIndexes": [ 3511 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3511 ] , "outputIndexes": [ 2585 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_898_output_0", "inputIndexes": [ 2551, 20 ] , "outputIndexes": [ 2586 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_899_output_0", "inputIndexes": [ 2559, 20 ] , "outputIndexes": [ 2587 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_365_output_0", "inputIndexes": [ 2586, 2587, 77, 31 ] , "outputIndexes": [ 2588 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_254_output_0", "inputIndexes": [ 2585, 2588 ] , "outputIndexes": [ 2589 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_226_output_0", "inputIndexes": [ 2589, 58 ] , "outputIndexes": [ 2590 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_395_output_0", "inputIndexes": [ 2589 ] , "outputIndexes": [ 2591 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10534", "inputIndexes": [ 2591 ] , "outputIndexes": [ 2592 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10536", "inputIndexes": [ 2591 ] , "outputIndexes": [ 2593 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10538", "inputIndexes": [ 2593, 2593 ] , "outputIndexes": [ 2594 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10539", "inputIndexes": [ 2594 ] , "outputIndexes": [ 2595 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10541", "inputIndexes": [ 2594, 12 ] , "outputIndexes": [ 2596 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10542", "inputIndexes": [ 2596 ] , "outputIndexes": [ 2597 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10545", "inputIndexes": [ 2592, 2595, 2597, 15 ] , "outputIndexes": [ 2598 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10546", "inputIndexes": [ 2598 ] , "outputIndexes": [ 2599 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10547", "inputIndexes": [ 61, 2599 ] , "outputIndexes": [ 2600 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10548", "inputIndexes": [ 2600, 2599 ] , "outputIndexes": [ 2601 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_426_output_0", "inputIndexes": [ 2591, 2601, 2594 ] , "outputIndexes": [ 2602 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_85_output_0", "inputIndexes": [ 2602, 73 ] , "outputIndexes": [ 2603 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_905_output_0", "inputIndexes": [ 2603, 20 ] , "outputIndexes": [ 2604 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_115_output_0", "inputIndexes": [ 2589, 2604, 76, 77, 15 ] , "outputIndexes": [ 2605 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_57_output_0", "inputIndexes": [ 2605 ] , "outputIndexes": [ 2606 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_904_output_0", "inputIndexes": [ 2603, 20 ] , "outputIndexes": [ 2607 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_114_output_0", "inputIndexes": [ 2589, 20, 2607, 77, 15 ] , "outputIndexes": [ 2608 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_368_output_0", "inputIndexes": [ 2606, 2608 ] , "outputIndexes": [ 2609 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_227_output_0", "inputIndexes": [ 2609, 89 ] , "outputIndexes": [ 2610 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_141_output_0", "inputIndexes": [ 2590, 2610 ] , "outputIndexes": [ 2611 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/self_attn/v_proj/Linear", "inputIndexes": [ 3505 ] , "outputIndexes": [ 3514 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 110740644, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3514 ] , "outputIndexes": [ 3515 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3515 ] , "outputIndexes": [ 2612 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_900_output_0", "inputIndexes": [ 2551, 20 ] , "outputIndexes": [ 2613 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_901_output_0", "inputIndexes": [ 2559, 20 ] , "outputIndexes": [ 2614 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_366_output_0", "inputIndexes": [ 2613, 2614, 77, 31 ] , "outputIndexes": [ 2615 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_255_output_0", "inputIndexes": [ 2612, 2615 ] , "outputIndexes": [ 2616 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_260_output_0", "inputIndexes": [ 2584, 2611, 2616, 124 ] , "outputIndexes": [ 2617 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2617 ] , "outputIndexes": [ 3516 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3516 ] , "outputIndexes": [ 3517 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/self_attn/o_proj/Linear", "inputIndexes": [ 3517 ] , "outputIndexes": [ 3518 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 110865322, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3518 ] , "outputIndexes": [ 3519 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3519 ] , "outputIndexes": [ 2618 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_143_output_0", "inputIndexes": [ 2538, 2618 ] , "outputIndexes": [ 2619 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_28/Mul_1_output_0", "inputIndexes": [ 2619 ] , "outputIndexes": [ 2620 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 111238832, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2620 ] , "outputIndexes": [ 3520 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3520 ] , "outputIndexes": [ 3521 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/mlp/gate_proj/Linear", "inputIndexes": [ 3521 ] , "outputIndexes": [ 3522 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 111243440, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3522 ] , "outputIndexes": [ 3523 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3523 ] , "outputIndexes": [ 2621 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_28/Mul_output_0", "inputIndexes": [ 2621 ] , "outputIndexes": [ 2622 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/mlp/up_proj/Linear", "inputIndexes": [ 3521 ] , "outputIndexes": [ 3526 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 112239030, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3526 ] , "outputIndexes": [ 3527 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3527 ] , "outputIndexes": [ 2623 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_28/Mul_output_0", "inputIndexes": [ 2622, 2623 ] , "outputIndexes": [ 2624 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2624 ] , "outputIndexes": [ 3528 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3528 ] , "outputIndexes": [ 3529 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.28/mlp/down_proj/Linear", "inputIndexes": [ 3529 ] , "outputIndexes": [ 3530 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 113234620, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.28/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3530 ] , "outputIndexes": [ 3531 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.28/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3531 ] , "outputIndexes": [ 2625 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_144_output_0", "inputIndexes": [ 2619, 2625 ] , "outputIndexes": [ 2626 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_261_output_0", "inputIndexes": [ 2626, 3 ] , "outputIndexes": [ 2627 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/input_layernorm_29/Mul_1_output_0", "inputIndexes": [ 2627 ] , "outputIndexes": [ 2628 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 114174914, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/self_attn/q_proj/Linear/pre_reshape", "inputIndexes": [ 2628 ] , "outputIndexes": [ 3532 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/self_attn/q_proj/Linear/pre_convert", "inputIndexes": [ 3532 ] , "outputIndexes": [ 3533 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/self_attn/q_proj/Linear", "inputIndexes": [ 3533 ] , "outputIndexes": [ 3534 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 114179522, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/self_attn/q_proj/Linear/post_convert", "inputIndexes": [ 3534 ] , "outputIndexes": [ 3535 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/self_attn/q_proj/Linear/post_reshape", "inputIndexes": [ 3535 ] , "outputIndexes": [ 2629 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_406_output_0", "inputIndexes": [ 2628 ] , "outputIndexes": [ 2630 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10867", "inputIndexes": [ 2630 ] , "outputIndexes": [ 2631 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10869", "inputIndexes": [ 2630 ] , "outputIndexes": [ 2632 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10871", "inputIndexes": [ 2632, 2632 ] , "outputIndexes": [ 2633 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10872", "inputIndexes": [ 2633 ] , "outputIndexes": [ 2634 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10874", "inputIndexes": [ 2633, 12 ] , "outputIndexes": [ 2635 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10875", "inputIndexes": [ 2635 ] , "outputIndexes": [ 2636 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10878", "inputIndexes": [ 2631, 2634, 2636, 15 ] , "outputIndexes": [ 2637 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10879", "inputIndexes": [ 2637 ] , "outputIndexes": [ 2638 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10881", "inputIndexes": [ 2638, 2638 ] , "outputIndexes": [ 2639 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_438_output_0", "inputIndexes": [ 2630, 2639, 2633 ] , "outputIndexes": [ 2640 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_928_output_0", "inputIndexes": [ 2640, 20 ] , "outputIndexes": [ 2641 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10889", "inputIndexes": [ 2633 ] , "outputIndexes": [ 2642 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10892", "inputIndexes": [ 2635 ] , "outputIndexes": [ 2643 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10895", "inputIndexes": [ 2631, 2642, 2643, 15 ] , "outputIndexes": [ 2644 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10896", "inputIndexes": [ 2644 ] , "outputIndexes": [ 2645 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10897", "inputIndexes": [ 12, 2645 ] , "outputIndexes": [ 2646 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10898", "inputIndexes": [ 2646, 2645 ] , "outputIndexes": [ 2647 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_439_output_0", "inputIndexes": [ 2630, 2647, 2633 ] , "outputIndexes": [ 2648 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_929_output_0", "inputIndexes": [ 2648, 20 ] , "outputIndexes": [ 2649 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_377_output_0", "inputIndexes": [ 2641, 2649, 30, 31 ] , "outputIndexes": [ 2650 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_262_output_0", "inputIndexes": [ 2629, 2650 ] , "outputIndexes": [ 2651 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_232_output_0", "inputIndexes": [ 2651, 58 ] , "outputIndexes": [ 2652 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_408_output_0", "inputIndexes": [ 2651 ] , "outputIndexes": [ 2653 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10967", "inputIndexes": [ 2653 ] , "outputIndexes": [ 2654 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10969", "inputIndexes": [ 2653 ] , "outputIndexes": [ 2655 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10971", "inputIndexes": [ 2655, 2655 ] , "outputIndexes": [ 2656 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10972", "inputIndexes": [ 2656 ] , "outputIndexes": [ 2657 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10974", "inputIndexes": [ 2656, 12 ] , "outputIndexes": [ 2658 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10975", "inputIndexes": [ 2658 ] , "outputIndexes": [ 2659 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10978", "inputIndexes": [ 2654, 2657, 2659, 15 ] , "outputIndexes": [ 2660 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10979", "inputIndexes": [ 2660 ] , "outputIndexes": [ 2661 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10980", "inputIndexes": [ 61, 2661 ] , "outputIndexes": [ 2662 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10981", "inputIndexes": [ 2662, 2661 ] , "outputIndexes": [ 2663 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_440_output_0", "inputIndexes": [ 2653, 2663, 2656 ] , "outputIndexes": [ 2664 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_87_output_0", "inputIndexes": [ 2664, 73 ] , "outputIndexes": [ 2665 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_935_output_0", "inputIndexes": [ 2665, 20 ] , "outputIndexes": [ 2666 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_117_output_0", "inputIndexes": [ 2651, 2666, 76, 77, 15 ] , "outputIndexes": [ 2667 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_58_output_0", "inputIndexes": [ 2667 ] , "outputIndexes": [ 2668 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_934_output_0", "inputIndexes": [ 2665, 20 ] , "outputIndexes": [ 2669 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_116_output_0", "inputIndexes": [ 2651, 20, 2669, 77, 15 ] , "outputIndexes": [ 2670 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_380_output_0", "inputIndexes": [ 2668, 2670 ] , "outputIndexes": [ 2671 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_233_output_0", "inputIndexes": [ 2671, 89 ] , "outputIndexes": [ 2672 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_145_output_0", "inputIndexes": [ 2652, 2672 ] , "outputIndexes": [ 2673 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/self_attn/k_proj/Linear", "inputIndexes": [ 3533 ] , "outputIndexes": [ 3538 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 114553032, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/self_attn/k_proj/Linear/post_convert", "inputIndexes": [ 3538 ] , "outputIndexes": [ 3539 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/self_attn/k_proj/Linear/post_reshape", "inputIndexes": [ 3539 ] , "outputIndexes": [ 2674 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_930_output_0", "inputIndexes": [ 2640, 20 ] , "outputIndexes": [ 2675 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_931_output_0", "inputIndexes": [ 2648, 20 ] , "outputIndexes": [ 2676 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_378_output_0", "inputIndexes": [ 2675, 2676, 77, 31 ] , "outputIndexes": [ 2677 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_263_output_0", "inputIndexes": [ 2674, 2677 ] , "outputIndexes": [ 2678 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_234_output_0", "inputIndexes": [ 2678, 58 ] , "outputIndexes": [ 2679 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Shape", "name": "/Shape_409_output_0", "inputIndexes": [ 2678 ] , "outputIndexes": [ 2680 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Shape", "name": "Shape10905", "inputIndexes": [ 2680 ] , "outputIndexes": [ 2681 ] , "main_type": "NONE", "defaultDimentionFormat": "NCHW" } , { "type": "Rank", "name": "Rank10907", "inputIndexes": [ 2680 ] , "outputIndexes": [ 2682 ] , "main_type": "NONE", "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10909", "inputIndexes": [ 2682, 2682 ] , "outputIndexes": [ 2683 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10910", "inputIndexes": [ 2683 ] , "outputIndexes": [ 2684 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10912", "inputIndexes": [ 2683, 12 ] , "outputIndexes": [ 2685 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "Unsqueeze10913", "inputIndexes": [ 2685 ] , "outputIndexes": [ 2686 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "StridedSlice10916", "inputIndexes": [ 2681, 2684, 2686, 15 ] , "outputIndexes": [ 2687 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Squeeze", "name": "Squeeze10917", "inputIndexes": [ 2687 ] , "outputIndexes": [ 2688 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10918", "inputIndexes": [ 61, 2688 ] , "outputIndexes": [ 2689 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "BinaryOp10919", "inputIndexes": [ 2689, 2688 ] , "outputIndexes": [ 2690 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "GatherV2", "name": "/Gather_441_output_0", "inputIndexes": [ 2680, 2690, 2683 ] , "outputIndexes": [ 2691 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Div_88_output_0", "inputIndexes": [ 2691, 73 ] , "outputIndexes": [ 2692 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_937_output_0", "inputIndexes": [ 2692, 20 ] , "outputIndexes": [ 2693 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_119_output_0", "inputIndexes": [ 2678, 2693, 76, 77, 15 ] , "outputIndexes": [ 2694 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/Neg_59_output_0", "inputIndexes": [ 2694 ] , "outputIndexes": [ 2695 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_936_output_0", "inputIndexes": [ 2692, 20 ] , "outputIndexes": [ 2696 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/Slice_118_output_0", "inputIndexes": [ 2678, 20, 2696, 77, 15 ] , "outputIndexes": [ 2697 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_381_output_0", "inputIndexes": [ 2695, 2697 ] , "outputIndexes": [ 2698 ] , "main_type": "Axis", "main": { "axis": -1 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Mul_235_output_0", "inputIndexes": [ 2698, 89 ] , "outputIndexes": [ 2699 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_146_output_0", "inputIndexes": [ 2679, 2699 ] , "outputIndexes": [ 2700 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/self_attn/v_proj/Linear", "inputIndexes": [ 3533 ] , "outputIndexes": [ 3542 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 192, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 768, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 114677710, 110854, 13824, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/self_attn/v_proj/Linear/post_convert", "inputIndexes": [ 3542 ] , "outputIndexes": [ 3543 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/self_attn/v_proj/Linear/post_reshape", "inputIndexes": [ 3543 ] , "outputIndexes": [ 2701 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 192 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_932_output_0", "inputIndexes": [ 2640, 20 ] , "outputIndexes": [ 2702 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Unsqueeze", "name": "/Unsqueeze_933_output_0", "inputIndexes": [ 2648, 20 ] , "outputIndexes": [ 2703 ] , "main_type": "SqueezeParam", "main": { } , "defaultDimentionFormat": "NHWC" } , { "type": "Concat", "name": "/Concat_379_output_0", "inputIndexes": [ 2702, 2703, 77, 31 ] , "outputIndexes": [ 2704 ] , "main_type": "Axis", "main": { "axis": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/Reshape_264_output_0", "inputIndexes": [ 2701, 2704 ] , "outputIndexes": [ 2705 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Attention", "name": "Attention/Reshape_269_output_0", "inputIndexes": [ 2673, 2700, 2705, 124 ] , "outputIndexes": [ 2706 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/self_attn/o_proj/Linear/pre_reshape", "inputIndexes": [ 2706 ] , "outputIndexes": [ 3544 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/self_attn/o_proj/Linear/pre_convert", "inputIndexes": [ 3544 ] , "outputIndexes": [ 3545 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/self_attn/o_proj/Linear", "inputIndexes": [ 3545 ] , "outputIndexes": [ 3546 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2304, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 114802388, 332038, 41472, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/self_attn/o_proj/Linear/post_convert", "inputIndexes": [ 3546 ] , "outputIndexes": [ 3547 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/self_attn/o_proj/Linear/post_reshape", "inputIndexes": [ 3547 ] , "outputIndexes": [ 2707 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_148_output_0", "inputIndexes": [ 2627, 2707 ] , "outputIndexes": [ 2708 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/post_attention_layernorm_29/Mul_1_output_0", "inputIndexes": [ 2708 ] , "outputIndexes": [ 2709 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 115175898, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/mlp/gate_proj/Linear/pre_reshape", "inputIndexes": [ 2709 ] , "outputIndexes": [ 3548 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/mlp/gate_proj/Linear/pre_convert", "inputIndexes": [ 3548 ] , "outputIndexes": [ 3549 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/mlp/gate_proj/Linear", "inputIndexes": [ 3549 ] , "outputIndexes": [ 3550 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 115180506, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/mlp/gate_proj/Linear/post_convert", "inputIndexes": [ 3550 ] , "outputIndexes": [ 3551 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/mlp/gate_proj/Linear/post_reshape", "inputIndexes": [ 3551 ] , "outputIndexes": [ 2710 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "UnaryOp", "name": "/mlp/act_fn_29/Mul_output_0", "inputIndexes": [ 2710 ] , "outputIndexes": [ 2711 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/mlp/up_proj/Linear", "inputIndexes": [ 3549 ] , "outputIndexes": [ 3554 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 1536, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6144, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 116176096, 884998, 110592, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/mlp/up_proj/Linear/post_convert", "inputIndexes": [ 3554 ] , "outputIndexes": [ 3555 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/mlp/up_proj/Linear/post_reshape", "inputIndexes": [ 3555 ] , "outputIndexes": [ 2712 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 1536 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/mlp_29/Mul_output_0", "inputIndexes": [ 2711, 2712 ] , "outputIndexes": [ 2713 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/mlp/down_proj/Linear/pre_reshape", "inputIndexes": [ 2713 ] , "outputIndexes": [ 3556 ] , "main_type": "Reshape", "main": { "dims": [ -1, 1536, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/mlp/down_proj/Linear/pre_convert", "inputIndexes": [ 3556 ] , "outputIndexes": [ 3557 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/layers.29/mlp/down_proj/Linear", "inputIndexes": [ 3557 ] , "outputIndexes": [ 3558 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 576, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 1536, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 6912, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 117171686, 884998, 55296, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/layers.29/mlp/down_proj/Linear/post_convert", "inputIndexes": [ 3558 ] , "outputIndexes": [ 3559 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/layers.29/mlp/down_proj/Linear/post_reshape", "inputIndexes": [ 3559 ] , "outputIndexes": [ 2714 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 576 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "BinaryOp", "name": "/Add_149_output_0", "inputIndexes": [ 2708, 2714 ] , "outputIndexes": [ 2715 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "defaultDimentionFormat": "NHWC" } , { "type": "StridedSlice", "name": "/lm/Slice_output_0", "inputIndexes": [ 2715, 2716, 76, 15, 15 ] , "outputIndexes": [ 2717 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "defaultDimentionFormat": "NHWC" } , { "type": "LayerNorm", "name": "/lm/norm/Mul_1_output_0", "inputIndexes": [ 2717 ] , "outputIndexes": [ 2718 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.00001, "group": 1, "external": [ 118111980, 2304, 2304 ] , "useRMSNorm": true } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/lm/lm_head/Linear/pre_reshape", "inputIndexes": [ 2718 ] , "outputIndexes": [ 3560 ] , "main_type": "Reshape", "main": { "dims": [ -1, 576, 1, 1 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/lm/lm_head/Linear/pre_convert", "inputIndexes": [ 3560 ] , "outputIndexes": [ 3561 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "defaultDimentionFormat": "NHWC" } , { "type": "Convolution", "name": "/lm/lm_head/Linear", "inputIndexes": [ 3561 ] , "outputIndexes": [ 3562 ] , "main_type": "Convolution2D", "main": { "common": { "dilateX": 1, "dilateY": 1, "strideX": 1, "strideY": 1, "kernelX": 1, "kernelY": 1, "padX": 0, "padY": 0, "group": 1, "outputCount": 49280, "relu": false, "padMode": "CAFFE", "relu6": false, "inputCount": 576, "hasOutputShape": false } , "quanParameter": { "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 197120, "has_scaleInt": false, "type": 1, "useInt32": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 118116588, 28385542, 3548160, 0, 0 ] } , "defaultDimentionFormat": "NHWC" } , { "type": "ConvertTensor", "name": "/lm/lm_head/Linear/post_convert", "inputIndexes": [ 3562 ] , "outputIndexes": [ 3563 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "defaultDimentionFormat": "NHWC" } , { "type": "Reshape", "name": "/lm/lm_head/Linear/post_reshape", "inputIndexes": [ 3563 ] , "outputIndexes": [ 2719 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 49280 ] , "dimType": "NCHW" } , "defaultDimentionFormat": "NHWC" } ] , "tensorName": [ "past_key_values", "presents", "input_ids", "/Constant_output_0", "/Reshape_output_0", "/input_layernorm/Mul_1_output_0", "/FakeLinear_output_0", "/Shape_output_0", "Shape51", "BinaryOp54", "BinaryOp55", "Unsqueeze56", "Const9", "BinaryOp58", "Unsqueeze59", "Unsqueeze61", "StridedSlice62", "BinaryOp64", "BinaryOp65", "/Gather_1_output_0", "/rotary/Constant_4_output_0", "/Unsqueeze_output_0", "Unsqueeze75", "Unsqueeze78", "StridedSlice81", "Squeeze82", "BinaryOp83", "BinaryOp84", "/Gather_2_output_0", "/Unsqueeze_1_output_0", "/Constant_4_output_0", "/Constant_5_output_0", "/Concat_output_0", "/Reshape_1_output_0", "position_ids", "/rotary/Cast_output_0", "/rotary/Constant_1_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_2_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_7_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape107", "BinaryOp110", "BinaryOp111", "Unsqueeze112", "BinaryOp114", "Unsqueeze115", "StridedSlice118", "BinaryOp120", "BinaryOp121", "/Gather_3_output_0", "/Mul_output_0", "/Shape_2_output_0", "/Constant_6_output_0", "Shape238", "BinaryOp241", "BinaryOp242", "Unsqueeze243", "BinaryOp245", "Unsqueeze246", "StridedSlice249", "Squeeze250", "BinaryOp251", "BinaryOp252", "/Gather_5_output_0", "/rotary/Constant_6_output_0", "/Div_output_0", "/Unsqueeze_7_output_0", "/Constant_19_output_0", "/Constant_7_output_0", "/Slice_1_output_0", "/Neg_output_0", "/Unsqueeze_6_output_0", "/Slice_output_0", "/Concat_3_output_0", "Unsqueeze157", "Unsqueeze160", "StridedSlice163", "Squeeze164", "BinaryOp165", "BinaryOp166", "/Gather_4_output_0", "/Mul_1_output_0", "/Add_output_0", "/FakeLinear_1_output_0", "/Unsqueeze_2_output_0", "/Unsqueeze_3_output_0", "/Concat_1_output_0", "/Reshape_2_output_0", "/Mul_2_output_0", "/Shape_3_output_0", "Shape126", "BinaryOp129", "BinaryOp130", "Unsqueeze131", "BinaryOp133", "Unsqueeze134", "StridedSlice137", "Squeeze138", "BinaryOp139", "BinaryOp140", "/Gather_6_output_0", "/Div_1_output_0", "/Unsqueeze_9_output_0", "/Slice_3_output_0", "/Neg_1_output_0", "/Unsqueeze_8_output_0", "/Slice_2_output_0", "/Concat_4_output_0", "/Mul_3_output_0", "/Add_1_output_0", "/FakeLinear_2_output_0", "/Unsqueeze_4_output_0", "/Unsqueeze_5_output_0", "/Concat_2_output_0", "/Reshape_3_output_0", "attention_mask", "/Reshape_8_output_0", "/FakeLinear_3_output_0", "/Add_3_output_0", "/post_attention_layernorm/Mul_1_output_0", "/mlp/gate_proj/FakeLinear_output_0", "/mlp/act_fn/Mul_output_0", "/mlp/up_proj/FakeLinear_output_0", "/mlp/Mul_output_0", "/mlp/down_proj/FakeLinear_output_0", "/Add_4_output_0", "/Reshape_9_output_0", "/input_layernorm_1/Mul_1_output_0", "/FakeLinear_4_output_0", "/Shape_14_output_0", "Shape481", "BinaryOp484", "BinaryOp485", "Unsqueeze486", "BinaryOp488", "Unsqueeze489", "StridedSlice492", "BinaryOp494", "BinaryOp495", "/Gather_18_output_0", "/Unsqueeze_32_output_0", "Unsqueeze503", "Unsqueeze506", "StridedSlice509", "Squeeze510", "BinaryOp511", "BinaryOp512", "/Gather_19_output_0", "/Unsqueeze_33_output_0", "/Concat_13_output_0", "/Reshape_10_output_0", "/Mul_8_output_0", "/Shape_16_output_0", "Shape612", "BinaryOp615", "BinaryOp616", "Unsqueeze617", "BinaryOp619", "Unsqueeze620", "StridedSlice623", "Squeeze624", "BinaryOp625", "BinaryOp626", "/Gather_20_output_0", "/Div_3_output_0", "/Unsqueeze_39_output_0", "/Slice_5_output_0", "/Neg_2_output_0", "/Unsqueeze_38_output_0", "/Slice_4_output_0", "/Concat_16_output_0", "/Mul_9_output_0", "/Add_5_output_0", "/FakeLinear_5_output_0", "/Unsqueeze_34_output_0", "/Unsqueeze_35_output_0", "/Concat_14_output_0", "/Reshape_11_output_0", "/Mul_10_output_0", "/Shape_17_output_0", "Shape519", "BinaryOp522", "BinaryOp523", "Unsqueeze524", "BinaryOp526", "Unsqueeze527", "StridedSlice530", "Squeeze531", "BinaryOp532", "BinaryOp533", "/Gather_21_output_0", "/Div_4_output_0", "/Unsqueeze_41_output_0", "/Slice_7_output_0", "/Neg_3_output_0", "/Unsqueeze_40_output_0", "/Slice_6_output_0", "/Concat_17_output_0", "/Mul_11_output_0", "/Add_6_output_0", "/FakeLinear_6_output_0", "/Unsqueeze_36_output_0", "/Unsqueeze_37_output_0", "/Concat_15_output_0", "/Reshape_12_output_0", "/Reshape_17_output_0", "/FakeLinear_7_output_0", "/Add_8_output_0", "/post_attention_layernorm_1/Mul_1_output_0", "/mlp/gate_proj_1/FakeLinear_output_0", "/mlp/act_fn_1/Mul_output_0", "/mlp/up_proj_1/FakeLinear_output_0", "/mlp_1/Mul_output_0", "/mlp/down_proj_1/FakeLinear_output_0", "/Add_9_output_0", "/Reshape_18_output_0", "/input_layernorm_2/Mul_1_output_0", "/FakeLinear_8_output_0", "/Shape_28_output_0", "Shape851", "BinaryOp854", "BinaryOp855", "Unsqueeze856", "BinaryOp858", "Unsqueeze859", "StridedSlice862", "BinaryOp864", "BinaryOp865", "/Gather_33_output_0", "/Unsqueeze_64_output_0", "Unsqueeze873", "Unsqueeze876", "StridedSlice879", "Squeeze880", "BinaryOp881", "BinaryOp882", "/Gather_34_output_0", "/Unsqueeze_65_output_0", "/Concat_26_output_0", "/Reshape_19_output_0", "/Mul_16_output_0", "/Shape_30_output_0", "Shape982", "BinaryOp985", "BinaryOp986", "Unsqueeze987", "BinaryOp989", "Unsqueeze990", "StridedSlice993", "Squeeze994", "BinaryOp995", "BinaryOp996", "/Gather_35_output_0", "/Div_6_output_0", "/Unsqueeze_71_output_0", "/Slice_9_output_0", "/Neg_4_output_0", "/Unsqueeze_70_output_0", "/Slice_8_output_0", "/Concat_29_output_0", "/Mul_17_output_0", "/Add_10_output_0", "/FakeLinear_9_output_0", "/Unsqueeze_66_output_0", "/Unsqueeze_67_output_0", "/Concat_27_output_0", "/Reshape_20_output_0", "/Mul_18_output_0", "/Shape_31_output_0", "Shape889", "BinaryOp892", "BinaryOp893", "Unsqueeze894", "BinaryOp896", "Unsqueeze897", "StridedSlice900", "Squeeze901", "BinaryOp902", "BinaryOp903", "/Gather_36_output_0", "/Div_7_output_0", "/Unsqueeze_73_output_0", "/Slice_11_output_0", "/Neg_5_output_0", "/Unsqueeze_72_output_0", "/Slice_10_output_0", "/Concat_30_output_0", "/Mul_19_output_0", "/Add_11_output_0", "/FakeLinear_10_output_0", "/Unsqueeze_68_output_0", "/Unsqueeze_69_output_0", "/Concat_28_output_0", "/Reshape_21_output_0", "/Reshape_26_output_0", "/FakeLinear_11_output_0", "/Add_13_output_0", "/post_attention_layernorm_2/Mul_1_output_0", "/mlp/gate_proj_2/FakeLinear_output_0", "/mlp/act_fn_2/Mul_output_0", "/mlp/up_proj_2/FakeLinear_output_0", "/mlp_2/Mul_output_0", "/mlp/down_proj_2/FakeLinear_output_0", "/Add_14_output_0", "/Reshape_27_output_0", "/input_layernorm_3/Mul_1_output_0", "/FakeLinear_12_output_0", "/Shape_42_output_0", "Shape1221", "BinaryOp1224", "BinaryOp1225", "Unsqueeze1226", "BinaryOp1228", "Unsqueeze1229", "StridedSlice1232", "BinaryOp1234", "BinaryOp1235", "/Gather_48_output_0", "/Unsqueeze_96_output_0", "Unsqueeze1243", "Unsqueeze1246", "StridedSlice1249", "Squeeze1250", "BinaryOp1251", "BinaryOp1252", "/Gather_49_output_0", "/Unsqueeze_97_output_0", "/Concat_39_output_0", "/Reshape_28_output_0", "/Mul_24_output_0", "/Shape_44_output_0", "Shape1353", "BinaryOp1356", "BinaryOp1357", "Unsqueeze1358", "BinaryOp1360", "Unsqueeze1361", "StridedSlice1364", "Squeeze1365", "BinaryOp1366", "BinaryOp1367", "/Gather_50_output_0", "/Div_9_output_0", "/Unsqueeze_103_output_0", "/Slice_13_output_0", "/Neg_6_output_0", "/Unsqueeze_102_output_0", "/Slice_12_output_0", "/Concat_42_output_0", "/Mul_25_output_0", "/Add_15_output_0", "/FakeLinear_13_output_0", "/Unsqueeze_98_output_0", "/Unsqueeze_99_output_0", "/Concat_40_output_0", "/Reshape_29_output_0", "/Mul_26_output_0", "/Shape_45_output_0", "Shape1259", "BinaryOp1262", "BinaryOp1263", "Unsqueeze1264", "BinaryOp1266", "Unsqueeze1267", "StridedSlice1270", "Squeeze1271", "BinaryOp1272", "BinaryOp1273", "/Gather_51_output_0", "/Div_10_output_0", "/Unsqueeze_105_output_0", "/Slice_15_output_0", "/Neg_7_output_0", "/Unsqueeze_104_output_0", "/Slice_14_output_0", "/Concat_43_output_0", "/Mul_27_output_0", "/Add_16_output_0", "/FakeLinear_14_output_0", "/Unsqueeze_100_output_0", "/Unsqueeze_101_output_0", "/Concat_41_output_0", "/Reshape_30_output_0", "/Reshape_35_output_0", "/FakeLinear_15_output_0", "/Add_18_output_0", "/post_attention_layernorm_3/Mul_1_output_0", "/mlp/gate_proj_3/FakeLinear_output_0", "/mlp/act_fn_3/Mul_output_0", "/mlp/up_proj_3/FakeLinear_output_0", "/mlp_3/Mul_output_0", "/mlp/down_proj_3/FakeLinear_output_0", "/Add_19_output_0", "/Reshape_36_output_0", "/input_layernorm_4/Mul_1_output_0", "/FakeLinear_16_output_0", "/Shape_56_output_0", "Shape1592", "BinaryOp1595", "BinaryOp1596", "Unsqueeze1597", "BinaryOp1599", "Unsqueeze1600", "StridedSlice1603", "BinaryOp1605", "BinaryOp1606", "/Gather_63_output_0", "/Unsqueeze_128_output_0", "Unsqueeze1614", "Unsqueeze1617", "StridedSlice1620", "Squeeze1621", "BinaryOp1622", "BinaryOp1623", "/Gather_64_output_0", "/Unsqueeze_129_output_0", "/Concat_52_output_0", "/Reshape_37_output_0", "/Mul_32_output_0", "/Shape_58_output_0", "Shape1724", "BinaryOp1727", "BinaryOp1728", "Unsqueeze1729", "BinaryOp1731", "Unsqueeze1732", "StridedSlice1735", "Squeeze1736", "BinaryOp1737", "BinaryOp1738", "/Gather_65_output_0", "/Div_12_output_0", "/Unsqueeze_135_output_0", "/Slice_17_output_0", "/Neg_8_output_0", "/Unsqueeze_134_output_0", "/Slice_16_output_0", "/Concat_55_output_0", "/Mul_33_output_0", "/Add_20_output_0", "/FakeLinear_17_output_0", "/Unsqueeze_130_output_0", "/Unsqueeze_131_output_0", "/Concat_53_output_0", "/Reshape_38_output_0", "/Mul_34_output_0", "/Shape_59_output_0", "Shape1630", "BinaryOp1633", "BinaryOp1634", "Unsqueeze1635", "BinaryOp1637", "Unsqueeze1638", "StridedSlice1641", "Squeeze1642", "BinaryOp1643", "BinaryOp1644", "/Gather_66_output_0", "/Div_13_output_0", "/Unsqueeze_137_output_0", "/Slice_19_output_0", "/Neg_9_output_0", "/Unsqueeze_136_output_0", "/Slice_18_output_0", "/Concat_56_output_0", "/Mul_35_output_0", "/Add_21_output_0", "/FakeLinear_18_output_0", "/Unsqueeze_132_output_0", "/Unsqueeze_133_output_0", "/Concat_54_output_0", "/Reshape_39_output_0", "/Reshape_44_output_0", "/FakeLinear_19_output_0", "/Add_23_output_0", "/post_attention_layernorm_4/Mul_1_output_0", "/mlp/gate_proj_4/FakeLinear_output_0", "/mlp/act_fn_4/Mul_output_0", "/mlp/up_proj_4/FakeLinear_output_0", "/mlp_4/Mul_output_0", "/mlp/down_proj_4/FakeLinear_output_0", "/Add_24_output_0", "/Reshape_45_output_0", "/input_layernorm_5/Mul_1_output_0", "/FakeLinear_20_output_0", "/Shape_70_output_0", "Shape1963", "BinaryOp1966", "BinaryOp1967", "Unsqueeze1968", "BinaryOp1970", "Unsqueeze1971", "StridedSlice1974", "BinaryOp1976", "BinaryOp1977", "/Gather_78_output_0", "/Unsqueeze_160_output_0", "Unsqueeze1985", "Unsqueeze1988", "StridedSlice1991", "Squeeze1992", "BinaryOp1993", "BinaryOp1994", "/Gather_79_output_0", "/Unsqueeze_161_output_0", "/Concat_65_output_0", "/Reshape_46_output_0", "/Mul_40_output_0", "/Shape_72_output_0", "Shape2095", "BinaryOp2098", "BinaryOp2099", "Unsqueeze2100", "BinaryOp2102", "Unsqueeze2103", "StridedSlice2106", "Squeeze2107", "BinaryOp2108", "BinaryOp2109", "/Gather_80_output_0", "/Div_15_output_0", "/Unsqueeze_167_output_0", "/Slice_21_output_0", "/Neg_10_output_0", "/Unsqueeze_166_output_0", "/Slice_20_output_0", "/Concat_68_output_0", "/Mul_41_output_0", "/Add_25_output_0", "/FakeLinear_21_output_0", "/Unsqueeze_162_output_0", "/Unsqueeze_163_output_0", "/Concat_66_output_0", "/Reshape_47_output_0", "/Mul_42_output_0", "/Shape_73_output_0", "Shape2001", "BinaryOp2004", "BinaryOp2005", "Unsqueeze2006", "BinaryOp2008", "Unsqueeze2009", "StridedSlice2012", "Squeeze2013", "BinaryOp2014", "BinaryOp2015", "/Gather_81_output_0", "/Div_16_output_0", "/Unsqueeze_169_output_0", "/Slice_23_output_0", "/Neg_11_output_0", "/Unsqueeze_168_output_0", "/Slice_22_output_0", "/Concat_69_output_0", "/Mul_43_output_0", "/Add_26_output_0", "/FakeLinear_22_output_0", "/Unsqueeze_164_output_0", "/Unsqueeze_165_output_0", "/Concat_67_output_0", "/Reshape_48_output_0", "/Reshape_53_output_0", "/FakeLinear_23_output_0", "/Add_28_output_0", "/post_attention_layernorm_5/Mul_1_output_0", "/mlp/gate_proj_5/FakeLinear_output_0", "/mlp/act_fn_5/Mul_output_0", "/mlp/up_proj_5/FakeLinear_output_0", "/mlp_5/Mul_output_0", "/mlp/down_proj_5/FakeLinear_output_0", "/Add_29_output_0", "/Reshape_54_output_0", "/input_layernorm_6/Mul_1_output_0", "/FakeLinear_24_output_0", "/Shape_84_output_0", "Shape2334", "BinaryOp2337", "BinaryOp2338", "Unsqueeze2339", "BinaryOp2341", "Unsqueeze2342", "StridedSlice2345", "BinaryOp2347", "BinaryOp2348", "/Gather_93_output_0", "/Unsqueeze_192_output_0", "Unsqueeze2356", "Unsqueeze2359", "StridedSlice2362", "Squeeze2363", "BinaryOp2364", "BinaryOp2365", "/Gather_94_output_0", "/Unsqueeze_193_output_0", "/Concat_78_output_0", "/Reshape_55_output_0", "/Mul_48_output_0", "/Shape_86_output_0", "Shape2466", "BinaryOp2469", "BinaryOp2470", "Unsqueeze2471", "BinaryOp2473", "Unsqueeze2474", "StridedSlice2477", "Squeeze2478", "BinaryOp2479", "BinaryOp2480", "/Gather_95_output_0", "/Div_18_output_0", "/Unsqueeze_199_output_0", "/Slice_25_output_0", "/Neg_12_output_0", "/Unsqueeze_198_output_0", "/Slice_24_output_0", "/Concat_81_output_0", "/Mul_49_output_0", "/Add_30_output_0", "/FakeLinear_25_output_0", "/Unsqueeze_194_output_0", "/Unsqueeze_195_output_0", "/Concat_79_output_0", "/Reshape_56_output_0", "/Mul_50_output_0", "/Shape_87_output_0", "Shape2372", "BinaryOp2375", "BinaryOp2376", "Unsqueeze2377", "BinaryOp2379", "Unsqueeze2380", "StridedSlice2383", "Squeeze2384", "BinaryOp2385", "BinaryOp2386", "/Gather_96_output_0", "/Div_19_output_0", "/Unsqueeze_201_output_0", "/Slice_27_output_0", "/Neg_13_output_0", "/Unsqueeze_200_output_0", "/Slice_26_output_0", "/Concat_82_output_0", "/Mul_51_output_0", "/Add_31_output_0", "/FakeLinear_26_output_0", "/Unsqueeze_196_output_0", "/Unsqueeze_197_output_0", "/Concat_80_output_0", "/Reshape_57_output_0", "/Reshape_62_output_0", "/FakeLinear_27_output_0", "/Add_33_output_0", "/post_attention_layernorm_6/Mul_1_output_0", "/mlp/gate_proj_6/FakeLinear_output_0", "/mlp/act_fn_6/Mul_output_0", "/mlp/up_proj_6/FakeLinear_output_0", "/mlp_6/Mul_output_0", "/mlp/down_proj_6/FakeLinear_output_0", "/Add_34_output_0", "/Reshape_63_output_0", "/input_layernorm_7/Mul_1_output_0", "/FakeLinear_28_output_0", "/Shape_98_output_0", "Shape2705", "BinaryOp2708", "BinaryOp2709", "Unsqueeze2710", "BinaryOp2712", "Unsqueeze2713", "StridedSlice2716", "BinaryOp2718", "BinaryOp2719", "/Gather_108_output_0", "/Unsqueeze_224_output_0", "Unsqueeze2727", "Unsqueeze2730", "StridedSlice2733", "Squeeze2734", "BinaryOp2735", "BinaryOp2736", "/Gather_109_output_0", "/Unsqueeze_225_output_0", "/Concat_91_output_0", "/Reshape_64_output_0", "/Mul_56_output_0", "/Shape_100_output_0", "Shape2837", "BinaryOp2840", "BinaryOp2841", "Unsqueeze2842", "BinaryOp2844", "Unsqueeze2845", "StridedSlice2848", "Squeeze2849", "BinaryOp2850", "BinaryOp2851", "/Gather_110_output_0", "/Div_21_output_0", "/Unsqueeze_231_output_0", "/Slice_29_output_0", "/Neg_14_output_0", "/Unsqueeze_230_output_0", "/Slice_28_output_0", "/Concat_94_output_0", "/Mul_57_output_0", "/Add_35_output_0", "/FakeLinear_29_output_0", "/Unsqueeze_226_output_0", "/Unsqueeze_227_output_0", "/Concat_92_output_0", "/Reshape_65_output_0", "/Mul_58_output_0", "/Shape_101_output_0", "Shape2743", "BinaryOp2746", "BinaryOp2747", "Unsqueeze2748", "BinaryOp2750", "Unsqueeze2751", "StridedSlice2754", "Squeeze2755", "BinaryOp2756", "BinaryOp2757", "/Gather_111_output_0", "/Div_22_output_0", "/Unsqueeze_233_output_0", "/Slice_31_output_0", "/Neg_15_output_0", "/Unsqueeze_232_output_0", "/Slice_30_output_0", "/Concat_95_output_0", "/Mul_59_output_0", "/Add_36_output_0", "/FakeLinear_30_output_0", "/Unsqueeze_228_output_0", "/Unsqueeze_229_output_0", "/Concat_93_output_0", "/Reshape_66_output_0", "/Reshape_71_output_0", "/FakeLinear_31_output_0", "/Add_38_output_0", "/post_attention_layernorm_7/Mul_1_output_0", "/mlp/gate_proj_7/FakeLinear_output_0", "/mlp/act_fn_7/Mul_output_0", "/mlp/up_proj_7/FakeLinear_output_0", "/mlp_7/Mul_output_0", "/mlp/down_proj_7/FakeLinear_output_0", "/Add_39_output_0", "/Reshape_72_output_0", "/input_layernorm_8/Mul_1_output_0", "/FakeLinear_32_output_0", "/Shape_112_output_0", "Shape3076", "BinaryOp3079", "BinaryOp3080", "Unsqueeze3081", "BinaryOp3083", "Unsqueeze3084", "StridedSlice3087", "BinaryOp3089", "BinaryOp3090", "/Gather_123_output_0", "/Unsqueeze_256_output_0", "Unsqueeze3098", "Unsqueeze3101", "StridedSlice3104", "Squeeze3105", "BinaryOp3106", "BinaryOp3107", "/Gather_124_output_0", "/Unsqueeze_257_output_0", "/Concat_104_output_0", "/Reshape_73_output_0", "/Mul_64_output_0", "/Shape_114_output_0", "Shape3208", "BinaryOp3211", "BinaryOp3212", "Unsqueeze3213", "BinaryOp3215", "Unsqueeze3216", "StridedSlice3219", "Squeeze3220", "BinaryOp3221", "BinaryOp3222", "/Gather_125_output_0", "/Div_24_output_0", "/Unsqueeze_263_output_0", "/Slice_33_output_0", "/Neg_16_output_0", "/Unsqueeze_262_output_0", "/Slice_32_output_0", "/Concat_107_output_0", "/Mul_65_output_0", "/Add_40_output_0", "/FakeLinear_33_output_0", "/Unsqueeze_258_output_0", "/Unsqueeze_259_output_0", "/Concat_105_output_0", "/Reshape_74_output_0", "/Mul_66_output_0", "/Shape_115_output_0", "Shape3114", "BinaryOp3117", "BinaryOp3118", "Unsqueeze3119", "BinaryOp3121", "Unsqueeze3122", "StridedSlice3125", "Squeeze3126", "BinaryOp3127", "BinaryOp3128", "/Gather_126_output_0", "/Div_25_output_0", "/Unsqueeze_265_output_0", "/Slice_35_output_0", "/Neg_17_output_0", "/Unsqueeze_264_output_0", "/Slice_34_output_0", "/Concat_108_output_0", "/Mul_67_output_0", "/Add_41_output_0", "/FakeLinear_34_output_0", "/Unsqueeze_260_output_0", "/Unsqueeze_261_output_0", "/Concat_106_output_0", "/Reshape_75_output_0", "/Reshape_80_output_0", "/FakeLinear_35_output_0", "/Add_43_output_0", "/post_attention_layernorm_8/Mul_1_output_0", "/mlp/gate_proj_8/FakeLinear_output_0", "/mlp/act_fn_8/Mul_output_0", "/mlp/up_proj_8/FakeLinear_output_0", "/mlp_8/Mul_output_0", "/mlp/down_proj_8/FakeLinear_output_0", "/Add_44_output_0", "/Reshape_81_output_0", "/input_layernorm_9/Mul_1_output_0", "/FakeLinear_36_output_0", "/Shape_126_output_0", "Shape3447", "BinaryOp3450", "BinaryOp3451", "Unsqueeze3452", "BinaryOp3454", "Unsqueeze3455", "StridedSlice3458", "BinaryOp3460", "BinaryOp3461", "/Gather_138_output_0", "/Unsqueeze_288_output_0", "Unsqueeze3469", "Unsqueeze3472", "StridedSlice3475", "Squeeze3476", "BinaryOp3477", "BinaryOp3478", "/Gather_139_output_0", "/Unsqueeze_289_output_0", "/Concat_117_output_0", "/Reshape_82_output_0", "/Mul_72_output_0", "/Shape_128_output_0", "Shape3579", "BinaryOp3582", "BinaryOp3583", "Unsqueeze3584", "BinaryOp3586", "Unsqueeze3587", "StridedSlice3590", "Squeeze3591", "BinaryOp3592", "BinaryOp3593", "/Gather_140_output_0", "/Div_27_output_0", "/Unsqueeze_295_output_0", "/Slice_37_output_0", "/Neg_18_output_0", "/Unsqueeze_294_output_0", "/Slice_36_output_0", "/Concat_120_output_0", "/Mul_73_output_0", "/Add_45_output_0", "/FakeLinear_37_output_0", "/Unsqueeze_290_output_0", "/Unsqueeze_291_output_0", "/Concat_118_output_0", "/Reshape_83_output_0", "/Mul_74_output_0", "/Shape_129_output_0", "Shape3485", "BinaryOp3488", "BinaryOp3489", "Unsqueeze3490", "BinaryOp3492", "Unsqueeze3493", "StridedSlice3496", "Squeeze3497", "BinaryOp3498", "BinaryOp3499", "/Gather_141_output_0", "/Div_28_output_0", "/Unsqueeze_297_output_0", "/Slice_39_output_0", "/Neg_19_output_0", "/Unsqueeze_296_output_0", "/Slice_38_output_0", "/Concat_121_output_0", "/Mul_75_output_0", "/Add_46_output_0", "/FakeLinear_38_output_0", "/Unsqueeze_292_output_0", "/Unsqueeze_293_output_0", "/Concat_119_output_0", "/Reshape_84_output_0", "/Reshape_89_output_0", "/FakeLinear_39_output_0", "/Add_48_output_0", "/post_attention_layernorm_9/Mul_1_output_0", "/mlp/gate_proj_9/FakeLinear_output_0", "/mlp/act_fn_9/Mul_output_0", "/mlp/up_proj_9/FakeLinear_output_0", "/mlp_9/Mul_output_0", "/mlp/down_proj_9/FakeLinear_output_0", "/Add_49_output_0", "/Reshape_90_output_0", "/input_layernorm_10/Mul_1_output_0", "/FakeLinear_40_output_0", "/Shape_140_output_0", "Shape3818", "BinaryOp3821", "BinaryOp3822", "Unsqueeze3823", "BinaryOp3825", "Unsqueeze3826", "StridedSlice3829", "BinaryOp3831", "BinaryOp3832", "/Gather_153_output_0", "/Unsqueeze_320_output_0", "Unsqueeze3840", "Unsqueeze3843", "StridedSlice3846", "Squeeze3847", "BinaryOp3848", "BinaryOp3849", "/Gather_154_output_0", "/Unsqueeze_321_output_0", "/Concat_130_output_0", "/Reshape_91_output_0", "/Mul_80_output_0", "/Shape_142_output_0", "Shape3950", "BinaryOp3953", "BinaryOp3954", "Unsqueeze3955", "BinaryOp3957", "Unsqueeze3958", "StridedSlice3961", "Squeeze3962", "BinaryOp3963", "BinaryOp3964", "/Gather_155_output_0", "/Div_30_output_0", "/Unsqueeze_327_output_0", "/Slice_41_output_0", "/Neg_20_output_0", "/Unsqueeze_326_output_0", "/Slice_40_output_0", "/Concat_133_output_0", "/Mul_81_output_0", "/Add_50_output_0", "/FakeLinear_41_output_0", "/Unsqueeze_322_output_0", "/Unsqueeze_323_output_0", "/Concat_131_output_0", "/Reshape_92_output_0", "/Mul_82_output_0", "/Shape_143_output_0", "Shape3856", "BinaryOp3859", "BinaryOp3860", "Unsqueeze3861", "BinaryOp3863", "Unsqueeze3864", "StridedSlice3867", "Squeeze3868", "BinaryOp3869", "BinaryOp3870", "/Gather_156_output_0", "/Div_31_output_0", "/Unsqueeze_329_output_0", "/Slice_43_output_0", "/Neg_21_output_0", "/Unsqueeze_328_output_0", "/Slice_42_output_0", "/Concat_134_output_0", "/Mul_83_output_0", "/Add_51_output_0", "/FakeLinear_42_output_0", "/Unsqueeze_324_output_0", "/Unsqueeze_325_output_0", "/Concat_132_output_0", "/Reshape_93_output_0", "/Reshape_98_output_0", "/FakeLinear_43_output_0", "/Add_53_output_0", "/post_attention_layernorm_10/Mul_1_output_0", "/mlp/gate_proj_10/FakeLinear_output_0", "/mlp/act_fn_10/Mul_output_0", "/mlp/up_proj_10/FakeLinear_output_0", "/mlp_10/Mul_output_0", "/mlp/down_proj_10/FakeLinear_output_0", "/Add_54_output_0", "/Reshape_99_output_0", "/input_layernorm_11/Mul_1_output_0", "/FakeLinear_44_output_0", "/Shape_154_output_0", "Shape4189", "BinaryOp4192", "BinaryOp4193", "Unsqueeze4194", "BinaryOp4196", "Unsqueeze4197", "StridedSlice4200", "BinaryOp4202", "BinaryOp4203", "/Gather_168_output_0", "/Unsqueeze_352_output_0", "Unsqueeze4211", "Unsqueeze4214", "StridedSlice4217", "Squeeze4218", "BinaryOp4219", "BinaryOp4220", "/Gather_169_output_0", "/Unsqueeze_353_output_0", "/Concat_143_output_0", "/Reshape_100_output_0", "/Mul_88_output_0", "/Shape_156_output_0", "Shape4321", "BinaryOp4324", "BinaryOp4325", "Unsqueeze4326", "BinaryOp4328", "Unsqueeze4329", "StridedSlice4332", "Squeeze4333", "BinaryOp4334", "BinaryOp4335", "/Gather_170_output_0", "/Div_33_output_0", "/Unsqueeze_359_output_0", "/Slice_45_output_0", "/Neg_22_output_0", "/Unsqueeze_358_output_0", "/Slice_44_output_0", "/Concat_146_output_0", "/Mul_89_output_0", "/Add_55_output_0", "/FakeLinear_45_output_0", "/Unsqueeze_354_output_0", "/Unsqueeze_355_output_0", "/Concat_144_output_0", "/Reshape_101_output_0", "/Mul_90_output_0", "/Shape_157_output_0", "Shape4227", "BinaryOp4230", "BinaryOp4231", "Unsqueeze4232", "BinaryOp4234", "Unsqueeze4235", "StridedSlice4238", "Squeeze4239", "BinaryOp4240", "BinaryOp4241", "/Gather_171_output_0", "/Div_34_output_0", "/Unsqueeze_361_output_0", "/Slice_47_output_0", "/Neg_23_output_0", "/Unsqueeze_360_output_0", "/Slice_46_output_0", "/Concat_147_output_0", "/Mul_91_output_0", "/Add_56_output_0", "/FakeLinear_46_output_0", "/Unsqueeze_356_output_0", "/Unsqueeze_357_output_0", "/Concat_145_output_0", "/Reshape_102_output_0", "/Reshape_107_output_0", "/FakeLinear_47_output_0", "/Add_58_output_0", "/post_attention_layernorm_11/Mul_1_output_0", "/mlp/gate_proj_11/FakeLinear_output_0", "/mlp/act_fn_11/Mul_output_0", "/mlp/up_proj_11/FakeLinear_output_0", "/mlp_11/Mul_output_0", "/mlp/down_proj_11/FakeLinear_output_0", "/Add_59_output_0", "/Reshape_108_output_0", "/input_layernorm_12/Mul_1_output_0", "/FakeLinear_48_output_0", "/Shape_168_output_0", "Shape4560", "BinaryOp4563", "BinaryOp4564", "Unsqueeze4565", "BinaryOp4567", "Unsqueeze4568", "StridedSlice4571", "BinaryOp4573", "BinaryOp4574", "/Gather_183_output_0", "/Unsqueeze_384_output_0", "Unsqueeze4582", "Unsqueeze4585", "StridedSlice4588", "Squeeze4589", "BinaryOp4590", "BinaryOp4591", "/Gather_184_output_0", "/Unsqueeze_385_output_0", "/Concat_156_output_0", "/Reshape_109_output_0", "/Mul_96_output_0", "/Shape_170_output_0", "Shape4692", "BinaryOp4695", "BinaryOp4696", "Unsqueeze4697", "BinaryOp4699", "Unsqueeze4700", "StridedSlice4703", "Squeeze4704", "BinaryOp4705", "BinaryOp4706", "/Gather_185_output_0", "/Div_36_output_0", "/Unsqueeze_391_output_0", "/Slice_49_output_0", "/Neg_24_output_0", "/Unsqueeze_390_output_0", "/Slice_48_output_0", "/Concat_159_output_0", "/Mul_97_output_0", "/Add_60_output_0", "/FakeLinear_49_output_0", "/Unsqueeze_386_output_0", "/Unsqueeze_387_output_0", "/Concat_157_output_0", "/Reshape_110_output_0", "/Mul_98_output_0", "/Shape_171_output_0", "Shape4598", "BinaryOp4601", "BinaryOp4602", "Unsqueeze4603", "BinaryOp4605", "Unsqueeze4606", "StridedSlice4609", "Squeeze4610", "BinaryOp4611", "BinaryOp4612", "/Gather_186_output_0", "/Div_37_output_0", "/Unsqueeze_393_output_0", "/Slice_51_output_0", "/Neg_25_output_0", "/Unsqueeze_392_output_0", "/Slice_50_output_0", "/Concat_160_output_0", "/Mul_99_output_0", "/Add_61_output_0", "/FakeLinear_50_output_0", "/Unsqueeze_388_output_0", "/Unsqueeze_389_output_0", "/Concat_158_output_0", "/Reshape_111_output_0", "/Reshape_116_output_0", "/FakeLinear_51_output_0", "/Add_63_output_0", "/post_attention_layernorm_12/Mul_1_output_0", "/mlp/gate_proj_12/FakeLinear_output_0", "/mlp/act_fn_12/Mul_output_0", "/mlp/up_proj_12/FakeLinear_output_0", "/mlp_12/Mul_output_0", "/mlp/down_proj_12/FakeLinear_output_0", "/Add_64_output_0", "/Reshape_117_output_0", "/input_layernorm_13/Mul_1_output_0", "/FakeLinear_52_output_0", "/Shape_182_output_0", "Shape4931", "BinaryOp4934", "BinaryOp4935", "Unsqueeze4936", "BinaryOp4938", "Unsqueeze4939", "StridedSlice4942", "BinaryOp4944", "BinaryOp4945", "/Gather_198_output_0", "/Unsqueeze_416_output_0", "Unsqueeze4953", "Unsqueeze4956", "StridedSlice4959", "Squeeze4960", "BinaryOp4961", "BinaryOp4962", "/Gather_199_output_0", "/Unsqueeze_417_output_0", "/Concat_169_output_0", "/Reshape_118_output_0", "/Mul_104_output_0", "/Shape_184_output_0", "Shape5063", "BinaryOp5066", "BinaryOp5067", "Unsqueeze5068", "BinaryOp5070", "Unsqueeze5071", "StridedSlice5074", "Squeeze5075", "BinaryOp5076", "BinaryOp5077", "/Gather_200_output_0", "/Div_39_output_0", "/Unsqueeze_423_output_0", "/Slice_53_output_0", "/Neg_26_output_0", "/Unsqueeze_422_output_0", "/Slice_52_output_0", "/Concat_172_output_0", "/Mul_105_output_0", "/Add_65_output_0", "/FakeLinear_53_output_0", "/Unsqueeze_418_output_0", "/Unsqueeze_419_output_0", "/Concat_170_output_0", "/Reshape_119_output_0", "/Mul_106_output_0", "/Shape_185_output_0", "Shape4969", "BinaryOp4972", "BinaryOp4973", "Unsqueeze4974", "BinaryOp4976", "Unsqueeze4977", "StridedSlice4980", "Squeeze4981", "BinaryOp4982", "BinaryOp4983", "/Gather_201_output_0", "/Div_40_output_0", "/Unsqueeze_425_output_0", "/Slice_55_output_0", "/Neg_27_output_0", "/Unsqueeze_424_output_0", "/Slice_54_output_0", "/Concat_173_output_0", "/Mul_107_output_0", "/Add_66_output_0", "/FakeLinear_54_output_0", "/Unsqueeze_420_output_0", "/Unsqueeze_421_output_0", "/Concat_171_output_0", "/Reshape_120_output_0", "/Reshape_125_output_0", "/FakeLinear_55_output_0", "/Add_68_output_0", "/post_attention_layernorm_13/Mul_1_output_0", "/mlp/gate_proj_13/FakeLinear_output_0", "/mlp/act_fn_13/Mul_output_0", "/mlp/up_proj_13/FakeLinear_output_0", "/mlp_13/Mul_output_0", "/mlp/down_proj_13/FakeLinear_output_0", "/Add_69_output_0", "/Reshape_126_output_0", "/input_layernorm_14/Mul_1_output_0", "/FakeLinear_56_output_0", "/Shape_196_output_0", "Shape5302", "BinaryOp5305", "BinaryOp5306", "Unsqueeze5307", "BinaryOp5309", "Unsqueeze5310", "StridedSlice5313", "BinaryOp5315", "BinaryOp5316", "/Gather_213_output_0", "/Unsqueeze_448_output_0", "Unsqueeze5324", "Unsqueeze5327", "StridedSlice5330", "Squeeze5331", "BinaryOp5332", "BinaryOp5333", "/Gather_214_output_0", "/Unsqueeze_449_output_0", "/Concat_182_output_0", "/Reshape_127_output_0", "/Mul_112_output_0", "/Shape_198_output_0", "Shape5434", "BinaryOp5437", "BinaryOp5438", "Unsqueeze5439", "BinaryOp5441", "Unsqueeze5442", "StridedSlice5445", "Squeeze5446", "BinaryOp5447", "BinaryOp5448", "/Gather_215_output_0", "/Div_42_output_0", "/Unsqueeze_455_output_0", "/Slice_57_output_0", "/Neg_28_output_0", "/Unsqueeze_454_output_0", "/Slice_56_output_0", "/Concat_185_output_0", "/Mul_113_output_0", "/Add_70_output_0", "/FakeLinear_57_output_0", "/Unsqueeze_450_output_0", "/Unsqueeze_451_output_0", "/Concat_183_output_0", "/Reshape_128_output_0", "/Mul_114_output_0", "/Shape_199_output_0", "Shape5340", "BinaryOp5343", "BinaryOp5344", "Unsqueeze5345", "BinaryOp5347", "Unsqueeze5348", "StridedSlice5351", "Squeeze5352", "BinaryOp5353", "BinaryOp5354", "/Gather_216_output_0", "/Div_43_output_0", "/Unsqueeze_457_output_0", "/Slice_59_output_0", "/Neg_29_output_0", "/Unsqueeze_456_output_0", "/Slice_58_output_0", "/Concat_186_output_0", "/Mul_115_output_0", "/Add_71_output_0", "/FakeLinear_58_output_0", "/Unsqueeze_452_output_0", "/Unsqueeze_453_output_0", "/Concat_184_output_0", "/Reshape_129_output_0", "/Reshape_134_output_0", "/FakeLinear_59_output_0", "/Add_73_output_0", "/post_attention_layernorm_14/Mul_1_output_0", "/mlp/gate_proj_14/FakeLinear_output_0", "/mlp/act_fn_14/Mul_output_0", "/mlp/up_proj_14/FakeLinear_output_0", "/mlp_14/Mul_output_0", "/mlp/down_proj_14/FakeLinear_output_0", "/Add_74_output_0", "/Reshape_135_output_0", "/input_layernorm_15/Mul_1_output_0", "/FakeLinear_60_output_0", "/Shape_210_output_0", "Shape5673", "BinaryOp5676", "BinaryOp5677", "Unsqueeze5678", "BinaryOp5680", "Unsqueeze5681", "StridedSlice5684", "BinaryOp5686", "BinaryOp5687", "/Gather_228_output_0", "/Unsqueeze_480_output_0", "Unsqueeze5695", "Unsqueeze5698", "StridedSlice5701", "Squeeze5702", "BinaryOp5703", "BinaryOp5704", "/Gather_229_output_0", "/Unsqueeze_481_output_0", "/Concat_195_output_0", "/Reshape_136_output_0", "/Mul_120_output_0", "/Shape_212_output_0", "Shape5805", "BinaryOp5808", "BinaryOp5809", "Unsqueeze5810", "BinaryOp5812", "Unsqueeze5813", "StridedSlice5816", "Squeeze5817", "BinaryOp5818", "BinaryOp5819", "/Gather_230_output_0", "/Div_45_output_0", "/Unsqueeze_487_output_0", "/Slice_61_output_0", "/Neg_30_output_0", "/Unsqueeze_486_output_0", "/Slice_60_output_0", "/Concat_198_output_0", "/Mul_121_output_0", "/Add_75_output_0", "/FakeLinear_61_output_0", "/Unsqueeze_482_output_0", "/Unsqueeze_483_output_0", "/Concat_196_output_0", "/Reshape_137_output_0", "/Mul_122_output_0", "/Shape_213_output_0", "Shape5711", "BinaryOp5714", "BinaryOp5715", "Unsqueeze5716", "BinaryOp5718", "Unsqueeze5719", "StridedSlice5722", "Squeeze5723", "BinaryOp5724", "BinaryOp5725", "/Gather_231_output_0", "/Div_46_output_0", "/Unsqueeze_489_output_0", "/Slice_63_output_0", "/Neg_31_output_0", "/Unsqueeze_488_output_0", "/Slice_62_output_0", "/Concat_199_output_0", "/Mul_123_output_0", "/Add_76_output_0", "/FakeLinear_62_output_0", "/Unsqueeze_484_output_0", "/Unsqueeze_485_output_0", "/Concat_197_output_0", "/Reshape_138_output_0", "/Reshape_143_output_0", "/FakeLinear_63_output_0", "/Add_78_output_0", "/post_attention_layernorm_15/Mul_1_output_0", "/mlp/gate_proj_15/FakeLinear_output_0", "/mlp/act_fn_15/Mul_output_0", "/mlp/up_proj_15/FakeLinear_output_0", "/mlp_15/Mul_output_0", "/mlp/down_proj_15/FakeLinear_output_0", "/Add_79_output_0", "/Reshape_144_output_0", "/input_layernorm_16/Mul_1_output_0", "/FakeLinear_64_output_0", "/Shape_224_output_0", "Shape6044", "BinaryOp6047", "BinaryOp6048", "Unsqueeze6049", "BinaryOp6051", "Unsqueeze6052", "StridedSlice6055", "BinaryOp6057", "BinaryOp6058", "/Gather_243_output_0", "/Unsqueeze_512_output_0", "Unsqueeze6066", "Unsqueeze6069", "StridedSlice6072", "Squeeze6073", "BinaryOp6074", "BinaryOp6075", "/Gather_244_output_0", "/Unsqueeze_513_output_0", "/Concat_208_output_0", "/Reshape_145_output_0", "/Mul_128_output_0", "/Shape_226_output_0", "Shape6176", "BinaryOp6179", "BinaryOp6180", "Unsqueeze6181", "BinaryOp6183", "Unsqueeze6184", "StridedSlice6187", "Squeeze6188", "BinaryOp6189", "BinaryOp6190", "/Gather_245_output_0", "/Div_48_output_0", "/Unsqueeze_519_output_0", "/Slice_65_output_0", "/Neg_32_output_0", "/Unsqueeze_518_output_0", "/Slice_64_output_0", "/Concat_211_output_0", "/Mul_129_output_0", "/Add_80_output_0", "/FakeLinear_65_output_0", "/Unsqueeze_514_output_0", "/Unsqueeze_515_output_0", "/Concat_209_output_0", "/Reshape_146_output_0", "/Mul_130_output_0", "/Shape_227_output_0", "Shape6082", "BinaryOp6085", "BinaryOp6086", "Unsqueeze6087", "BinaryOp6089", "Unsqueeze6090", "StridedSlice6093", "Squeeze6094", "BinaryOp6095", "BinaryOp6096", "/Gather_246_output_0", "/Div_49_output_0", "/Unsqueeze_521_output_0", "/Slice_67_output_0", "/Neg_33_output_0", "/Unsqueeze_520_output_0", "/Slice_66_output_0", "/Concat_212_output_0", "/Mul_131_output_0", "/Add_81_output_0", "/FakeLinear_66_output_0", "/Unsqueeze_516_output_0", "/Unsqueeze_517_output_0", "/Concat_210_output_0", "/Reshape_147_output_0", "/Reshape_152_output_0", "/FakeLinear_67_output_0", "/Add_83_output_0", "/post_attention_layernorm_16/Mul_1_output_0", "/mlp/gate_proj_16/FakeLinear_output_0", "/mlp/act_fn_16/Mul_output_0", "/mlp/up_proj_16/FakeLinear_output_0", "/mlp_16/Mul_output_0", "/mlp/down_proj_16/FakeLinear_output_0", "/Add_84_output_0", "/Reshape_153_output_0", "/input_layernorm_17/Mul_1_output_0", "/FakeLinear_68_output_0", "/Shape_238_output_0", "Shape6415", "BinaryOp6418", "BinaryOp6419", "Unsqueeze6420", "BinaryOp6422", "Unsqueeze6423", "StridedSlice6426", "BinaryOp6428", "BinaryOp6429", "/Gather_258_output_0", "/Unsqueeze_544_output_0", "Unsqueeze6437", "Unsqueeze6440", "StridedSlice6443", "Squeeze6444", "BinaryOp6445", "BinaryOp6446", "/Gather_259_output_0", "/Unsqueeze_545_output_0", "/Concat_221_output_0", "/Reshape_154_output_0", "/Mul_136_output_0", "/Shape_240_output_0", "Shape6547", "BinaryOp6550", "BinaryOp6551", "Unsqueeze6552", "BinaryOp6554", "Unsqueeze6555", "StridedSlice6558", "Squeeze6559", "BinaryOp6560", "BinaryOp6561", "/Gather_260_output_0", "/Div_51_output_0", "/Unsqueeze_551_output_0", "/Slice_69_output_0", "/Neg_34_output_0", "/Unsqueeze_550_output_0", "/Slice_68_output_0", "/Concat_224_output_0", "/Mul_137_output_0", "/Add_85_output_0", "/FakeLinear_69_output_0", "/Unsqueeze_546_output_0", "/Unsqueeze_547_output_0", "/Concat_222_output_0", "/Reshape_155_output_0", "/Mul_138_output_0", "/Shape_241_output_0", "Shape6453", "BinaryOp6456", "BinaryOp6457", "Unsqueeze6458", "BinaryOp6460", "Unsqueeze6461", "StridedSlice6464", "Squeeze6465", "BinaryOp6466", "BinaryOp6467", "/Gather_261_output_0", "/Div_52_output_0", "/Unsqueeze_553_output_0", "/Slice_71_output_0", "/Neg_35_output_0", "/Unsqueeze_552_output_0", "/Slice_70_output_0", "/Concat_225_output_0", "/Mul_139_output_0", "/Add_86_output_0", "/FakeLinear_70_output_0", "/Unsqueeze_548_output_0", "/Unsqueeze_549_output_0", "/Concat_223_output_0", "/Reshape_156_output_0", "/Reshape_161_output_0", "/FakeLinear_71_output_0", "/Add_88_output_0", "/post_attention_layernorm_17/Mul_1_output_0", "/mlp/gate_proj_17/FakeLinear_output_0", "/mlp/act_fn_17/Mul_output_0", "/mlp/up_proj_17/FakeLinear_output_0", "/mlp_17/Mul_output_0", "/mlp/down_proj_17/FakeLinear_output_0", "/Add_89_output_0", "/Reshape_162_output_0", "/input_layernorm_18/Mul_1_output_0", "/FakeLinear_72_output_0", "/Shape_252_output_0", "Shape6786", "BinaryOp6789", "BinaryOp6790", "Unsqueeze6791", "BinaryOp6793", "Unsqueeze6794", "StridedSlice6797", "BinaryOp6799", "BinaryOp6800", "/Gather_273_output_0", "/Unsqueeze_576_output_0", "Unsqueeze6808", "Unsqueeze6811", "StridedSlice6814", "Squeeze6815", "BinaryOp6816", "BinaryOp6817", "/Gather_274_output_0", "/Unsqueeze_577_output_0", "/Concat_234_output_0", "/Reshape_163_output_0", "/Mul_144_output_0", "/Shape_254_output_0", "Shape6918", "BinaryOp6921", "BinaryOp6922", "Unsqueeze6923", "BinaryOp6925", "Unsqueeze6926", "StridedSlice6929", "Squeeze6930", "BinaryOp6931", "BinaryOp6932", "/Gather_275_output_0", "/Div_54_output_0", "/Unsqueeze_583_output_0", "/Slice_73_output_0", "/Neg_36_output_0", "/Unsqueeze_582_output_0", "/Slice_72_output_0", "/Concat_237_output_0", "/Mul_145_output_0", "/Add_90_output_0", "/FakeLinear_73_output_0", "/Unsqueeze_578_output_0", "/Unsqueeze_579_output_0", "/Concat_235_output_0", "/Reshape_164_output_0", "/Mul_146_output_0", "/Shape_255_output_0", "Shape6824", "BinaryOp6827", "BinaryOp6828", "Unsqueeze6829", "BinaryOp6831", "Unsqueeze6832", "StridedSlice6835", "Squeeze6836", "BinaryOp6837", "BinaryOp6838", "/Gather_276_output_0", "/Div_55_output_0", "/Unsqueeze_585_output_0", "/Slice_75_output_0", "/Neg_37_output_0", "/Unsqueeze_584_output_0", "/Slice_74_output_0", "/Concat_238_output_0", "/Mul_147_output_0", "/Add_91_output_0", "/FakeLinear_74_output_0", "/Unsqueeze_580_output_0", "/Unsqueeze_581_output_0", "/Concat_236_output_0", "/Reshape_165_output_0", "/Reshape_170_output_0", "/FakeLinear_75_output_0", "/Add_93_output_0", "/post_attention_layernorm_18/Mul_1_output_0", "/mlp/gate_proj_18/FakeLinear_output_0", "/mlp/act_fn_18/Mul_output_0", "/mlp/up_proj_18/FakeLinear_output_0", "/mlp_18/Mul_output_0", "/mlp/down_proj_18/FakeLinear_output_0", "/Add_94_output_0", "/Reshape_171_output_0", "/input_layernorm_19/Mul_1_output_0", "/FakeLinear_76_output_0", "/Shape_266_output_0", "Shape7157", "BinaryOp7160", "BinaryOp7161", "Unsqueeze7162", "BinaryOp7164", "Unsqueeze7165", "StridedSlice7168", "BinaryOp7170", "BinaryOp7171", "/Gather_288_output_0", "/Unsqueeze_608_output_0", "Unsqueeze7179", "Unsqueeze7182", "StridedSlice7185", "Squeeze7186", "BinaryOp7187", "BinaryOp7188", "/Gather_289_output_0", "/Unsqueeze_609_output_0", "/Concat_247_output_0", "/Reshape_172_output_0", "/Mul_152_output_0", "/Shape_268_output_0", "Shape7289", "BinaryOp7292", "BinaryOp7293", "Unsqueeze7294", "BinaryOp7296", "Unsqueeze7297", "StridedSlice7300", "Squeeze7301", "BinaryOp7302", "BinaryOp7303", "/Gather_290_output_0", "/Div_57_output_0", "/Unsqueeze_615_output_0", "/Slice_77_output_0", "/Neg_38_output_0", "/Unsqueeze_614_output_0", "/Slice_76_output_0", "/Concat_250_output_0", "/Mul_153_output_0", "/Add_95_output_0", "/FakeLinear_77_output_0", "/Unsqueeze_610_output_0", "/Unsqueeze_611_output_0", "/Concat_248_output_0", "/Reshape_173_output_0", "/Mul_154_output_0", "/Shape_269_output_0", "Shape7195", "BinaryOp7198", "BinaryOp7199", "Unsqueeze7200", "BinaryOp7202", "Unsqueeze7203", "StridedSlice7206", "Squeeze7207", "BinaryOp7208", "BinaryOp7209", "/Gather_291_output_0", "/Div_58_output_0", "/Unsqueeze_617_output_0", "/Slice_79_output_0", "/Neg_39_output_0", "/Unsqueeze_616_output_0", "/Slice_78_output_0", "/Concat_251_output_0", "/Mul_155_output_0", "/Add_96_output_0", "/FakeLinear_78_output_0", "/Unsqueeze_612_output_0", "/Unsqueeze_613_output_0", "/Concat_249_output_0", "/Reshape_174_output_0", "/Reshape_179_output_0", "/FakeLinear_79_output_0", "/Add_98_output_0", "/post_attention_layernorm_19/Mul_1_output_0", "/mlp/gate_proj_19/FakeLinear_output_0", "/mlp/act_fn_19/Mul_output_0", "/mlp/up_proj_19/FakeLinear_output_0", "/mlp_19/Mul_output_0", "/mlp/down_proj_19/FakeLinear_output_0", "/Add_99_output_0", "/Reshape_180_output_0", "/input_layernorm_20/Mul_1_output_0", "/FakeLinear_80_output_0", "/Shape_280_output_0", "Shape7528", "BinaryOp7531", "BinaryOp7532", "Unsqueeze7533", "BinaryOp7535", "Unsqueeze7536", "StridedSlice7539", "BinaryOp7541", "BinaryOp7542", "/Gather_303_output_0", "/Unsqueeze_640_output_0", "Unsqueeze7550", "Unsqueeze7553", "StridedSlice7556", "Squeeze7557", "BinaryOp7558", "BinaryOp7559", "/Gather_304_output_0", "/Unsqueeze_641_output_0", "/Concat_260_output_0", "/Reshape_181_output_0", "/Mul_160_output_0", "/Shape_282_output_0", "Shape7660", "BinaryOp7663", "BinaryOp7664", "Unsqueeze7665", "BinaryOp7667", "Unsqueeze7668", "StridedSlice7671", "Squeeze7672", "BinaryOp7673", "BinaryOp7674", "/Gather_305_output_0", "/Div_60_output_0", "/Unsqueeze_647_output_0", "/Slice_81_output_0", "/Neg_40_output_0", "/Unsqueeze_646_output_0", "/Slice_80_output_0", "/Concat_263_output_0", "/Mul_161_output_0", "/Add_100_output_0", "/FakeLinear_81_output_0", "/Unsqueeze_642_output_0", "/Unsqueeze_643_output_0", "/Concat_261_output_0", "/Reshape_182_output_0", "/Mul_162_output_0", "/Shape_283_output_0", "Shape7566", "BinaryOp7569", "BinaryOp7570", "Unsqueeze7571", "BinaryOp7573", "Unsqueeze7574", "StridedSlice7577", "Squeeze7578", "BinaryOp7579", "BinaryOp7580", "/Gather_306_output_0", "/Div_61_output_0", "/Unsqueeze_649_output_0", "/Slice_83_output_0", "/Neg_41_output_0", "/Unsqueeze_648_output_0", "/Slice_82_output_0", "/Concat_264_output_0", "/Mul_163_output_0", "/Add_101_output_0", "/FakeLinear_82_output_0", "/Unsqueeze_644_output_0", "/Unsqueeze_645_output_0", "/Concat_262_output_0", "/Reshape_183_output_0", "/Reshape_188_output_0", "/FakeLinear_83_output_0", "/Add_103_output_0", "/post_attention_layernorm_20/Mul_1_output_0", "/mlp/gate_proj_20/FakeLinear_output_0", "/mlp/act_fn_20/Mul_output_0", "/mlp/up_proj_20/FakeLinear_output_0", "/mlp_20/Mul_output_0", "/mlp/down_proj_20/FakeLinear_output_0", "/Add_104_output_0", "/Reshape_189_output_0", "/input_layernorm_21/Mul_1_output_0", "/FakeLinear_84_output_0", "/Shape_294_output_0", "Shape7899", "BinaryOp7902", "BinaryOp7903", "Unsqueeze7904", "BinaryOp7906", "Unsqueeze7907", "StridedSlice7910", "BinaryOp7912", "BinaryOp7913", "/Gather_318_output_0", "/Unsqueeze_672_output_0", "Unsqueeze7921", "Unsqueeze7924", "StridedSlice7927", "Squeeze7928", "BinaryOp7929", "BinaryOp7930", "/Gather_319_output_0", "/Unsqueeze_673_output_0", "/Concat_273_output_0", "/Reshape_190_output_0", "/Mul_168_output_0", "/Shape_296_output_0", "Shape8031", "BinaryOp8034", "BinaryOp8035", "Unsqueeze8036", "BinaryOp8038", "Unsqueeze8039", "StridedSlice8042", "Squeeze8043", "BinaryOp8044", "BinaryOp8045", "/Gather_320_output_0", "/Div_63_output_0", "/Unsqueeze_679_output_0", "/Slice_85_output_0", "/Neg_42_output_0", "/Unsqueeze_678_output_0", "/Slice_84_output_0", "/Concat_276_output_0", "/Mul_169_output_0", "/Add_105_output_0", "/FakeLinear_85_output_0", "/Unsqueeze_674_output_0", "/Unsqueeze_675_output_0", "/Concat_274_output_0", "/Reshape_191_output_0", "/Mul_170_output_0", "/Shape_297_output_0", "Shape7937", "BinaryOp7940", "BinaryOp7941", "Unsqueeze7942", "BinaryOp7944", "Unsqueeze7945", "StridedSlice7948", "Squeeze7949", "BinaryOp7950", "BinaryOp7951", "/Gather_321_output_0", "/Div_64_output_0", "/Unsqueeze_681_output_0", "/Slice_87_output_0", "/Neg_43_output_0", "/Unsqueeze_680_output_0", "/Slice_86_output_0", "/Concat_277_output_0", "/Mul_171_output_0", "/Add_106_output_0", "/FakeLinear_86_output_0", "/Unsqueeze_676_output_0", "/Unsqueeze_677_output_0", "/Concat_275_output_0", "/Reshape_192_output_0", "/Reshape_197_output_0", "/FakeLinear_87_output_0", "/Add_108_output_0", "/post_attention_layernorm_21/Mul_1_output_0", "/mlp/gate_proj_21/FakeLinear_output_0", "/mlp/act_fn_21/Mul_output_0", "/mlp/up_proj_21/FakeLinear_output_0", "/mlp_21/Mul_output_0", "/mlp/down_proj_21/FakeLinear_output_0", "/Add_109_output_0", "/Reshape_198_output_0", "/input_layernorm_22/Mul_1_output_0", "/FakeLinear_88_output_0", "/Shape_308_output_0", "Shape8270", "BinaryOp8273", "BinaryOp8274", "Unsqueeze8275", "BinaryOp8277", "Unsqueeze8278", "StridedSlice8281", "BinaryOp8283", "BinaryOp8284", "/Gather_333_output_0", "/Unsqueeze_704_output_0", "Unsqueeze8292", "Unsqueeze8295", "StridedSlice8298", "Squeeze8299", "BinaryOp8300", "BinaryOp8301", "/Gather_334_output_0", "/Unsqueeze_705_output_0", "/Concat_286_output_0", "/Reshape_199_output_0", "/Mul_176_output_0", "/Shape_310_output_0", "Shape8402", "BinaryOp8405", "BinaryOp8406", "Unsqueeze8407", "BinaryOp8409", "Unsqueeze8410", "StridedSlice8413", "Squeeze8414", "BinaryOp8415", "BinaryOp8416", "/Gather_335_output_0", "/Div_66_output_0", "/Unsqueeze_711_output_0", "/Slice_89_output_0", "/Neg_44_output_0", "/Unsqueeze_710_output_0", "/Slice_88_output_0", "/Concat_289_output_0", "/Mul_177_output_0", "/Add_110_output_0", "/FakeLinear_89_output_0", "/Unsqueeze_706_output_0", "/Unsqueeze_707_output_0", "/Concat_287_output_0", "/Reshape_200_output_0", "/Mul_178_output_0", "/Shape_311_output_0", "Shape8308", "BinaryOp8311", "BinaryOp8312", "Unsqueeze8313", "BinaryOp8315", "Unsqueeze8316", "StridedSlice8319", "Squeeze8320", "BinaryOp8321", "BinaryOp8322", "/Gather_336_output_0", "/Div_67_output_0", "/Unsqueeze_713_output_0", "/Slice_91_output_0", "/Neg_45_output_0", "/Unsqueeze_712_output_0", "/Slice_90_output_0", "/Concat_290_output_0", "/Mul_179_output_0", "/Add_111_output_0", "/FakeLinear_90_output_0", "/Unsqueeze_708_output_0", "/Unsqueeze_709_output_0", "/Concat_288_output_0", "/Reshape_201_output_0", "/Reshape_206_output_0", "/FakeLinear_91_output_0", "/Add_113_output_0", "/post_attention_layernorm_22/Mul_1_output_0", "/mlp/gate_proj_22/FakeLinear_output_0", "/mlp/act_fn_22/Mul_output_0", "/mlp/up_proj_22/FakeLinear_output_0", "/mlp_22/Mul_output_0", "/mlp/down_proj_22/FakeLinear_output_0", "/Add_114_output_0", "/Reshape_207_output_0", "/input_layernorm_23/Mul_1_output_0", "/FakeLinear_92_output_0", "/Shape_322_output_0", "Shape8641", "BinaryOp8644", "BinaryOp8645", "Unsqueeze8646", "BinaryOp8648", "Unsqueeze8649", "StridedSlice8652", "BinaryOp8654", "BinaryOp8655", "/Gather_348_output_0", "/Unsqueeze_736_output_0", "Unsqueeze8663", "Unsqueeze8666", "StridedSlice8669", "Squeeze8670", "BinaryOp8671", "BinaryOp8672", "/Gather_349_output_0", "/Unsqueeze_737_output_0", "/Concat_299_output_0", "/Reshape_208_output_0", "/Mul_184_output_0", "/Shape_324_output_0", "Shape8773", "BinaryOp8776", "BinaryOp8777", "Unsqueeze8778", "BinaryOp8780", "Unsqueeze8781", "StridedSlice8784", "Squeeze8785", "BinaryOp8786", "BinaryOp8787", "/Gather_350_output_0", "/Div_69_output_0", "/Unsqueeze_743_output_0", "/Slice_93_output_0", "/Neg_46_output_0", "/Unsqueeze_742_output_0", "/Slice_92_output_0", "/Concat_302_output_0", "/Mul_185_output_0", "/Add_115_output_0", "/FakeLinear_93_output_0", "/Unsqueeze_738_output_0", "/Unsqueeze_739_output_0", "/Concat_300_output_0", "/Reshape_209_output_0", "/Mul_186_output_0", "/Shape_325_output_0", "Shape8679", "BinaryOp8682", "BinaryOp8683", "Unsqueeze8684", "BinaryOp8686", "Unsqueeze8687", "StridedSlice8690", "Squeeze8691", "BinaryOp8692", "BinaryOp8693", "/Gather_351_output_0", "/Div_70_output_0", "/Unsqueeze_745_output_0", "/Slice_95_output_0", "/Neg_47_output_0", "/Unsqueeze_744_output_0", "/Slice_94_output_0", "/Concat_303_output_0", "/Mul_187_output_0", "/Add_116_output_0", "/FakeLinear_94_output_0", "/Unsqueeze_740_output_0", "/Unsqueeze_741_output_0", "/Concat_301_output_0", "/Reshape_210_output_0", "/Reshape_215_output_0", "/FakeLinear_95_output_0", "/Add_118_output_0", "/post_attention_layernorm_23/Mul_1_output_0", "/mlp/gate_proj_23/FakeLinear_output_0", "/mlp/act_fn_23/Mul_output_0", "/mlp/up_proj_23/FakeLinear_output_0", "/mlp_23/Mul_output_0", "/mlp/down_proj_23/FakeLinear_output_0", "/Add_119_output_0", "/Reshape_216_output_0", "/input_layernorm_24/Mul_1_output_0", "/FakeLinear_96_output_0", "/Shape_336_output_0", "Shape9012", "BinaryOp9015", "BinaryOp9016", "Unsqueeze9017", "BinaryOp9019", "Unsqueeze9020", "StridedSlice9023", "BinaryOp9025", "BinaryOp9026", "/Gather_363_output_0", "/Unsqueeze_768_output_0", "Unsqueeze9034", "Unsqueeze9037", "StridedSlice9040", "Squeeze9041", "BinaryOp9042", "BinaryOp9043", "/Gather_364_output_0", "/Unsqueeze_769_output_0", "/Concat_312_output_0", "/Reshape_217_output_0", "/Mul_192_output_0", "/Shape_338_output_0", "Shape9144", "BinaryOp9147", "BinaryOp9148", "Unsqueeze9149", "BinaryOp9151", "Unsqueeze9152", "StridedSlice9155", "Squeeze9156", "BinaryOp9157", "BinaryOp9158", "/Gather_365_output_0", "/Div_72_output_0", "/Unsqueeze_775_output_0", "/Slice_97_output_0", "/Neg_48_output_0", "/Unsqueeze_774_output_0", "/Slice_96_output_0", "/Concat_315_output_0", "/Mul_193_output_0", "/Add_120_output_0", "/FakeLinear_97_output_0", "/Unsqueeze_770_output_0", "/Unsqueeze_771_output_0", "/Concat_313_output_0", "/Reshape_218_output_0", "/Mul_194_output_0", "/Shape_339_output_0", "Shape9050", "BinaryOp9053", "BinaryOp9054", "Unsqueeze9055", "BinaryOp9057", "Unsqueeze9058", "StridedSlice9061", "Squeeze9062", "BinaryOp9063", "BinaryOp9064", "/Gather_366_output_0", "/Div_73_output_0", "/Unsqueeze_777_output_0", "/Slice_99_output_0", "/Neg_49_output_0", "/Unsqueeze_776_output_0", "/Slice_98_output_0", "/Concat_316_output_0", "/Mul_195_output_0", "/Add_121_output_0", "/FakeLinear_98_output_0", "/Unsqueeze_772_output_0", "/Unsqueeze_773_output_0", "/Concat_314_output_0", "/Reshape_219_output_0", "/Reshape_224_output_0", "/FakeLinear_99_output_0", "/Add_123_output_0", "/post_attention_layernorm_24/Mul_1_output_0", "/mlp/gate_proj_24/FakeLinear_output_0", "/mlp/act_fn_24/Mul_output_0", "/mlp/up_proj_24/FakeLinear_output_0", "/mlp_24/Mul_output_0", "/mlp/down_proj_24/FakeLinear_output_0", "/Add_124_output_0", "/Reshape_225_output_0", "/input_layernorm_25/Mul_1_output_0", "/FakeLinear_100_output_0", "/Shape_350_output_0", "Shape9383", "BinaryOp9386", "BinaryOp9387", "Unsqueeze9388", "BinaryOp9390", "Unsqueeze9391", "StridedSlice9394", "BinaryOp9396", "BinaryOp9397", "/Gather_378_output_0", "/Unsqueeze_800_output_0", "Unsqueeze9405", "Unsqueeze9408", "StridedSlice9411", "Squeeze9412", "BinaryOp9413", "BinaryOp9414", "/Gather_379_output_0", "/Unsqueeze_801_output_0", "/Concat_325_output_0", "/Reshape_226_output_0", "/Mul_200_output_0", "/Shape_352_output_0", "Shape9515", "BinaryOp9518", "BinaryOp9519", "Unsqueeze9520", "BinaryOp9522", "Unsqueeze9523", "StridedSlice9526", "Squeeze9527", "BinaryOp9528", "BinaryOp9529", "/Gather_380_output_0", "/Div_75_output_0", "/Unsqueeze_807_output_0", "/Slice_101_output_0", "/Neg_50_output_0", "/Unsqueeze_806_output_0", "/Slice_100_output_0", "/Concat_328_output_0", "/Mul_201_output_0", "/Add_125_output_0", "/FakeLinear_101_output_0", "/Unsqueeze_802_output_0", "/Unsqueeze_803_output_0", "/Concat_326_output_0", "/Reshape_227_output_0", "/Mul_202_output_0", "/Shape_353_output_0", "Shape9421", "BinaryOp9424", "BinaryOp9425", "Unsqueeze9426", "BinaryOp9428", "Unsqueeze9429", "StridedSlice9432", "Squeeze9433", "BinaryOp9434", "BinaryOp9435", "/Gather_381_output_0", "/Div_76_output_0", "/Unsqueeze_809_output_0", "/Slice_103_output_0", "/Neg_51_output_0", "/Unsqueeze_808_output_0", "/Slice_102_output_0", "/Concat_329_output_0", "/Mul_203_output_0", "/Add_126_output_0", "/FakeLinear_102_output_0", "/Unsqueeze_804_output_0", "/Unsqueeze_805_output_0", "/Concat_327_output_0", "/Reshape_228_output_0", "/Reshape_233_output_0", "/FakeLinear_103_output_0", "/Add_128_output_0", "/post_attention_layernorm_25/Mul_1_output_0", "/mlp/gate_proj_25/FakeLinear_output_0", "/mlp/act_fn_25/Mul_output_0", "/mlp/up_proj_25/FakeLinear_output_0", "/mlp_25/Mul_output_0", "/mlp/down_proj_25/FakeLinear_output_0", "/Add_129_output_0", "/Reshape_234_output_0", "/input_layernorm_26/Mul_1_output_0", "/FakeLinear_104_output_0", "/Shape_364_output_0", "Shape9754", "BinaryOp9757", "BinaryOp9758", "Unsqueeze9759", "BinaryOp9761", "Unsqueeze9762", "StridedSlice9765", "BinaryOp9767", "BinaryOp9768", "/Gather_393_output_0", "/Unsqueeze_832_output_0", "Unsqueeze9776", "Unsqueeze9779", "StridedSlice9782", "Squeeze9783", "BinaryOp9784", "BinaryOp9785", "/Gather_394_output_0", "/Unsqueeze_833_output_0", "/Concat_338_output_0", "/Reshape_235_output_0", "/Mul_208_output_0", "/Shape_366_output_0", "Shape9886", "BinaryOp9889", "BinaryOp9890", "Unsqueeze9891", "BinaryOp9893", "Unsqueeze9894", "StridedSlice9897", "Squeeze9898", "BinaryOp9899", "BinaryOp9900", "/Gather_395_output_0", "/Div_78_output_0", "/Unsqueeze_839_output_0", "/Slice_105_output_0", "/Neg_52_output_0", "/Unsqueeze_838_output_0", "/Slice_104_output_0", "/Concat_341_output_0", "/Mul_209_output_0", "/Add_130_output_0", "/FakeLinear_105_output_0", "/Unsqueeze_834_output_0", "/Unsqueeze_835_output_0", "/Concat_339_output_0", "/Reshape_236_output_0", "/Mul_210_output_0", "/Shape_367_output_0", "Shape9792", "BinaryOp9795", "BinaryOp9796", "Unsqueeze9797", "BinaryOp9799", "Unsqueeze9800", "StridedSlice9803", "Squeeze9804", "BinaryOp9805", "BinaryOp9806", "/Gather_396_output_0", "/Div_79_output_0", "/Unsqueeze_841_output_0", "/Slice_107_output_0", "/Neg_53_output_0", "/Unsqueeze_840_output_0", "/Slice_106_output_0", "/Concat_342_output_0", "/Mul_211_output_0", "/Add_131_output_0", "/FakeLinear_106_output_0", "/Unsqueeze_836_output_0", "/Unsqueeze_837_output_0", "/Concat_340_output_0", "/Reshape_237_output_0", "/Reshape_242_output_0", "/FakeLinear_107_output_0", "/Add_133_output_0", "/post_attention_layernorm_26/Mul_1_output_0", "/mlp/gate_proj_26/FakeLinear_output_0", "/mlp/act_fn_26/Mul_output_0", "/mlp/up_proj_26/FakeLinear_output_0", "/mlp_26/Mul_output_0", "/mlp/down_proj_26/FakeLinear_output_0", "/Add_134_output_0", "/Reshape_243_output_0", "/input_layernorm_27/Mul_1_output_0", "/FakeLinear_108_output_0", "/Shape_378_output_0", "Shape10125", "BinaryOp10128", "BinaryOp10129", "Unsqueeze10130", "BinaryOp10132", "Unsqueeze10133", "StridedSlice10136", "BinaryOp10138", "BinaryOp10139", "/Gather_408_output_0", "/Unsqueeze_864_output_0", "Unsqueeze10147", "Unsqueeze10150", "StridedSlice10153", "Squeeze10154", "BinaryOp10155", "BinaryOp10156", "/Gather_409_output_0", "/Unsqueeze_865_output_0", "/Concat_351_output_0", "/Reshape_244_output_0", "/Mul_216_output_0", "/Shape_380_output_0", "Shape10257", "BinaryOp10260", "BinaryOp10261", "Unsqueeze10262", "BinaryOp10264", "Unsqueeze10265", "StridedSlice10268", "Squeeze10269", "BinaryOp10270", "BinaryOp10271", "/Gather_410_output_0", "/Div_81_output_0", "/Unsqueeze_871_output_0", "/Slice_109_output_0", "/Neg_54_output_0", "/Unsqueeze_870_output_0", "/Slice_108_output_0", "/Concat_354_output_0", "/Mul_217_output_0", "/Add_135_output_0", "/FakeLinear_109_output_0", "/Unsqueeze_866_output_0", "/Unsqueeze_867_output_0", "/Concat_352_output_0", "/Reshape_245_output_0", "/Mul_218_output_0", "/Shape_381_output_0", "Shape10163", "BinaryOp10166", "BinaryOp10167", "Unsqueeze10168", "BinaryOp10170", "Unsqueeze10171", "StridedSlice10174", "Squeeze10175", "BinaryOp10176", "BinaryOp10177", "/Gather_411_output_0", "/Div_82_output_0", "/Unsqueeze_873_output_0", "/Slice_111_output_0", "/Neg_55_output_0", "/Unsqueeze_872_output_0", "/Slice_110_output_0", "/Concat_355_output_0", "/Mul_219_output_0", "/Add_136_output_0", "/FakeLinear_110_output_0", "/Unsqueeze_868_output_0", "/Unsqueeze_869_output_0", "/Concat_353_output_0", "/Reshape_246_output_0", "/Reshape_251_output_0", "/FakeLinear_111_output_0", "/Add_138_output_0", "/post_attention_layernorm_27/Mul_1_output_0", "/mlp/gate_proj_27/FakeLinear_output_0", "/mlp/act_fn_27/Mul_output_0", "/mlp/up_proj_27/FakeLinear_output_0", "/mlp_27/Mul_output_0", "/mlp/down_proj_27/FakeLinear_output_0", "/Add_139_output_0", "/Reshape_252_output_0", "/input_layernorm_28/Mul_1_output_0", "/FakeLinear_112_output_0", "/Shape_392_output_0", "Shape10496", "BinaryOp10499", "BinaryOp10500", "Unsqueeze10501", "BinaryOp10503", "Unsqueeze10504", "StridedSlice10507", "BinaryOp10509", "BinaryOp10510", "/Gather_423_output_0", "/Unsqueeze_896_output_0", "Unsqueeze10518", "Unsqueeze10521", "StridedSlice10524", "Squeeze10525", "BinaryOp10526", "BinaryOp10527", "/Gather_424_output_0", "/Unsqueeze_897_output_0", "/Concat_364_output_0", "/Reshape_253_output_0", "/Mul_224_output_0", "/Shape_394_output_0", "Shape10628", "BinaryOp10631", "BinaryOp10632", "Unsqueeze10633", "BinaryOp10635", "Unsqueeze10636", "StridedSlice10639", "Squeeze10640", "BinaryOp10641", "BinaryOp10642", "/Gather_425_output_0", "/Div_84_output_0", "/Unsqueeze_903_output_0", "/Slice_113_output_0", "/Neg_56_output_0", "/Unsqueeze_902_output_0", "/Slice_112_output_0", "/Concat_367_output_0", "/Mul_225_output_0", "/Add_140_output_0", "/FakeLinear_113_output_0", "/Unsqueeze_898_output_0", "/Unsqueeze_899_output_0", "/Concat_365_output_0", "/Reshape_254_output_0", "/Mul_226_output_0", "/Shape_395_output_0", "Shape10534", "BinaryOp10537", "BinaryOp10538", "Unsqueeze10539", "BinaryOp10541", "Unsqueeze10542", "StridedSlice10545", "Squeeze10546", "BinaryOp10547", "BinaryOp10548", "/Gather_426_output_0", "/Div_85_output_0", "/Unsqueeze_905_output_0", "/Slice_115_output_0", "/Neg_57_output_0", "/Unsqueeze_904_output_0", "/Slice_114_output_0", "/Concat_368_output_0", "/Mul_227_output_0", "/Add_141_output_0", "/FakeLinear_114_output_0", "/Unsqueeze_900_output_0", "/Unsqueeze_901_output_0", "/Concat_366_output_0", "/Reshape_255_output_0", "/Reshape_260_output_0", "/FakeLinear_115_output_0", "/Add_143_output_0", "/post_attention_layernorm_28/Mul_1_output_0", "/mlp/gate_proj_28/FakeLinear_output_0", "/mlp/act_fn_28/Mul_output_0", "/mlp/up_proj_28/FakeLinear_output_0", "/mlp_28/Mul_output_0", "/mlp/down_proj_28/FakeLinear_output_0", "/Add_144_output_0", "/Reshape_261_output_0", "/input_layernorm_29/Mul_1_output_0", "/FakeLinear_116_output_0", "/Shape_406_output_0", "Shape10867", "BinaryOp10870", "BinaryOp10871", "Unsqueeze10872", "BinaryOp10874", "Unsqueeze10875", "StridedSlice10878", "BinaryOp10880", "BinaryOp10881", "/Gather_438_output_0", "/Unsqueeze_928_output_0", "Unsqueeze10889", "Unsqueeze10892", "StridedSlice10895", "Squeeze10896", "BinaryOp10897", "BinaryOp10898", "/Gather_439_output_0", "/Unsqueeze_929_output_0", "/Concat_377_output_0", "/Reshape_262_output_0", "/Mul_232_output_0", "/Shape_408_output_0", "Shape10967", "BinaryOp10970", "BinaryOp10971", "Unsqueeze10972", "BinaryOp10974", "Unsqueeze10975", "StridedSlice10978", "Squeeze10979", "BinaryOp10980", "BinaryOp10981", "/Gather_440_output_0", "/Div_87_output_0", "/Unsqueeze_935_output_0", "/Slice_117_output_0", "/Neg_58_output_0", "/Unsqueeze_934_output_0", "/Slice_116_output_0", "/Concat_380_output_0", "/Mul_233_output_0", "/Add_145_output_0", "/FakeLinear_117_output_0", "/Unsqueeze_930_output_0", "/Unsqueeze_931_output_0", "/Concat_378_output_0", "/Reshape_263_output_0", "/Mul_234_output_0", "/Shape_409_output_0", "Shape10905", "BinaryOp10908", "BinaryOp10909", "Unsqueeze10910", "BinaryOp10912", "Unsqueeze10913", "StridedSlice10916", "Squeeze10917", "BinaryOp10918", "BinaryOp10919", "/Gather_441_output_0", "/Div_88_output_0", "/Unsqueeze_937_output_0", "/Slice_119_output_0", "/Neg_59_output_0", "/Unsqueeze_936_output_0", "/Slice_118_output_0", "/Concat_381_output_0", "/Mul_235_output_0", "/Add_146_output_0", "/FakeLinear_118_output_0", "/Unsqueeze_932_output_0", "/Unsqueeze_933_output_0", "/Concat_379_output_0", "/Reshape_264_output_0", "/Reshape_269_output_0", "/FakeLinear_119_output_0", "/Add_148_output_0", "/post_attention_layernorm_29/Mul_1_output_0", "/mlp/gate_proj_29/FakeLinear_output_0", "/mlp/act_fn_29/Mul_output_0", "/mlp/up_proj_29/FakeLinear_output_0", "/mlp_29/Mul_output_0", "/mlp/down_proj_29/FakeLinear_output_0", "/Add_149_output_0", "logits_index", "/lm/Slice_output_0", "/lm/norm/Mul_1_output_0", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/layers.24/self_attn/q_proj/Linear/pre_reshape", "/layers.24/self_attn/q_proj/Linear/pre_convert", "/layers.24/self_attn/q_proj/Linear", "/layers.24/self_attn/q_proj/Linear/post_convert", "/layers.24/self_attn/k_proj/Linear/pre_reshape", "/layers.24/self_attn/k_proj/Linear/pre_convert", "/layers.24/self_attn/k_proj/Linear", "/layers.24/self_attn/k_proj/Linear/post_convert", "/layers.24/self_attn/v_proj/Linear/pre_reshape", "/layers.24/self_attn/v_proj/Linear/pre_convert", "/layers.24/self_attn/v_proj/Linear", "/layers.24/self_attn/v_proj/Linear/post_convert", "/layers.24/self_attn/o_proj/Linear/pre_reshape", "/layers.24/self_attn/o_proj/Linear/pre_convert", "/layers.24/self_attn/o_proj/Linear", "/layers.24/self_attn/o_proj/Linear/post_convert", "/layers.24/mlp/gate_proj/Linear/pre_reshape", "/layers.24/mlp/gate_proj/Linear/pre_convert", "/layers.24/mlp/gate_proj/Linear", "/layers.24/mlp/gate_proj/Linear/post_convert", "/layers.24/mlp/up_proj/Linear/pre_reshape", "/layers.24/mlp/up_proj/Linear/pre_convert", "/layers.24/mlp/up_proj/Linear", "/layers.24/mlp/up_proj/Linear/post_convert", "/layers.24/mlp/down_proj/Linear/pre_reshape", "/layers.24/mlp/down_proj/Linear/pre_convert", "/layers.24/mlp/down_proj/Linear", "/layers.24/mlp/down_proj/Linear/post_convert", "/layers.25/self_attn/q_proj/Linear/pre_reshape", "/layers.25/self_attn/q_proj/Linear/pre_convert", "/layers.25/self_attn/q_proj/Linear", "/layers.25/self_attn/q_proj/Linear/post_convert", "/layers.25/self_attn/k_proj/Linear/pre_reshape", "/layers.25/self_attn/k_proj/Linear/pre_convert", "/layers.25/self_attn/k_proj/Linear", "/layers.25/self_attn/k_proj/Linear/post_convert", "/layers.25/self_attn/v_proj/Linear/pre_reshape", "/layers.25/self_attn/v_proj/Linear/pre_convert", "/layers.25/self_attn/v_proj/Linear", "/layers.25/self_attn/v_proj/Linear/post_convert", "/layers.25/self_attn/o_proj/Linear/pre_reshape", "/layers.25/self_attn/o_proj/Linear/pre_convert", "/layers.25/self_attn/o_proj/Linear", "/layers.25/self_attn/o_proj/Linear/post_convert", "/layers.25/mlp/gate_proj/Linear/pre_reshape", "/layers.25/mlp/gate_proj/Linear/pre_convert", "/layers.25/mlp/gate_proj/Linear", "/layers.25/mlp/gate_proj/Linear/post_convert", "/layers.25/mlp/up_proj/Linear/pre_reshape", "/layers.25/mlp/up_proj/Linear/pre_convert", "/layers.25/mlp/up_proj/Linear", "/layers.25/mlp/up_proj/Linear/post_convert", "/layers.25/mlp/down_proj/Linear/pre_reshape", "/layers.25/mlp/down_proj/Linear/pre_convert", "/layers.25/mlp/down_proj/Linear", "/layers.25/mlp/down_proj/Linear/post_convert", "/layers.26/self_attn/q_proj/Linear/pre_reshape", "/layers.26/self_attn/q_proj/Linear/pre_convert", "/layers.26/self_attn/q_proj/Linear", "/layers.26/self_attn/q_proj/Linear/post_convert", "/layers.26/self_attn/k_proj/Linear/pre_reshape", "/layers.26/self_attn/k_proj/Linear/pre_convert", "/layers.26/self_attn/k_proj/Linear", "/layers.26/self_attn/k_proj/Linear/post_convert", "/layers.26/self_attn/v_proj/Linear/pre_reshape", "/layers.26/self_attn/v_proj/Linear/pre_convert", "/layers.26/self_attn/v_proj/Linear", "/layers.26/self_attn/v_proj/Linear/post_convert", "/layers.26/self_attn/o_proj/Linear/pre_reshape", "/layers.26/self_attn/o_proj/Linear/pre_convert", "/layers.26/self_attn/o_proj/Linear", "/layers.26/self_attn/o_proj/Linear/post_convert", "/layers.26/mlp/gate_proj/Linear/pre_reshape", "/layers.26/mlp/gate_proj/Linear/pre_convert", "/layers.26/mlp/gate_proj/Linear", "/layers.26/mlp/gate_proj/Linear/post_convert", "/layers.26/mlp/up_proj/Linear/pre_reshape", "/layers.26/mlp/up_proj/Linear/pre_convert", "/layers.26/mlp/up_proj/Linear", "/layers.26/mlp/up_proj/Linear/post_convert", "/layers.26/mlp/down_proj/Linear/pre_reshape", "/layers.26/mlp/down_proj/Linear/pre_convert", "/layers.26/mlp/down_proj/Linear", "/layers.26/mlp/down_proj/Linear/post_convert", "/layers.27/self_attn/q_proj/Linear/pre_reshape", "/layers.27/self_attn/q_proj/Linear/pre_convert", "/layers.27/self_attn/q_proj/Linear", "/layers.27/self_attn/q_proj/Linear/post_convert", "/layers.27/self_attn/k_proj/Linear/pre_reshape", "/layers.27/self_attn/k_proj/Linear/pre_convert", "/layers.27/self_attn/k_proj/Linear", "/layers.27/self_attn/k_proj/Linear/post_convert", "/layers.27/self_attn/v_proj/Linear/pre_reshape", "/layers.27/self_attn/v_proj/Linear/pre_convert", "/layers.27/self_attn/v_proj/Linear", "/layers.27/self_attn/v_proj/Linear/post_convert", "/layers.27/self_attn/o_proj/Linear/pre_reshape", "/layers.27/self_attn/o_proj/Linear/pre_convert", "/layers.27/self_attn/o_proj/Linear", "/layers.27/self_attn/o_proj/Linear/post_convert", "/layers.27/mlp/gate_proj/Linear/pre_reshape", "/layers.27/mlp/gate_proj/Linear/pre_convert", "/layers.27/mlp/gate_proj/Linear", "/layers.27/mlp/gate_proj/Linear/post_convert", "/layers.27/mlp/up_proj/Linear/pre_reshape", "/layers.27/mlp/up_proj/Linear/pre_convert", "/layers.27/mlp/up_proj/Linear", "/layers.27/mlp/up_proj/Linear/post_convert", "/layers.27/mlp/down_proj/Linear/pre_reshape", "/layers.27/mlp/down_proj/Linear/pre_convert", "/layers.27/mlp/down_proj/Linear", "/layers.27/mlp/down_proj/Linear/post_convert", "/layers.28/self_attn/q_proj/Linear/pre_reshape", "/layers.28/self_attn/q_proj/Linear/pre_convert", "/layers.28/self_attn/q_proj/Linear", "/layers.28/self_attn/q_proj/Linear/post_convert", "/layers.28/self_attn/k_proj/Linear/pre_reshape", "/layers.28/self_attn/k_proj/Linear/pre_convert", "/layers.28/self_attn/k_proj/Linear", "/layers.28/self_attn/k_proj/Linear/post_convert", "/layers.28/self_attn/v_proj/Linear/pre_reshape", "/layers.28/self_attn/v_proj/Linear/pre_convert", "/layers.28/self_attn/v_proj/Linear", "/layers.28/self_attn/v_proj/Linear/post_convert", "/layers.28/self_attn/o_proj/Linear/pre_reshape", "/layers.28/self_attn/o_proj/Linear/pre_convert", "/layers.28/self_attn/o_proj/Linear", "/layers.28/self_attn/o_proj/Linear/post_convert", "/layers.28/mlp/gate_proj/Linear/pre_reshape", "/layers.28/mlp/gate_proj/Linear/pre_convert", "/layers.28/mlp/gate_proj/Linear", "/layers.28/mlp/gate_proj/Linear/post_convert", "/layers.28/mlp/up_proj/Linear/pre_reshape", "/layers.28/mlp/up_proj/Linear/pre_convert", "/layers.28/mlp/up_proj/Linear", "/layers.28/mlp/up_proj/Linear/post_convert", "/layers.28/mlp/down_proj/Linear/pre_reshape", "/layers.28/mlp/down_proj/Linear/pre_convert", "/layers.28/mlp/down_proj/Linear", "/layers.28/mlp/down_proj/Linear/post_convert", "/layers.29/self_attn/q_proj/Linear/pre_reshape", "/layers.29/self_attn/q_proj/Linear/pre_convert", "/layers.29/self_attn/q_proj/Linear", "/layers.29/self_attn/q_proj/Linear/post_convert", "/layers.29/self_attn/k_proj/Linear/pre_reshape", "/layers.29/self_attn/k_proj/Linear/pre_convert", "/layers.29/self_attn/k_proj/Linear", "/layers.29/self_attn/k_proj/Linear/post_convert", "/layers.29/self_attn/v_proj/Linear/pre_reshape", "/layers.29/self_attn/v_proj/Linear/pre_convert", "/layers.29/self_attn/v_proj/Linear", "/layers.29/self_attn/v_proj/Linear/post_convert", "/layers.29/self_attn/o_proj/Linear/pre_reshape", "/layers.29/self_attn/o_proj/Linear/pre_convert", "/layers.29/self_attn/o_proj/Linear", "/layers.29/self_attn/o_proj/Linear/post_convert", "/layers.29/mlp/gate_proj/Linear/pre_reshape", "/layers.29/mlp/gate_proj/Linear/pre_convert", "/layers.29/mlp/gate_proj/Linear", "/layers.29/mlp/gate_proj/Linear/post_convert", "/layers.29/mlp/up_proj/Linear/pre_reshape", "/layers.29/mlp/up_proj/Linear/pre_convert", "/layers.29/mlp/up_proj/Linear", "/layers.29/mlp/up_proj/Linear/post_convert", "/layers.29/mlp/down_proj/Linear/pre_reshape", "/layers.29/mlp/down_proj/Linear/pre_convert", "/layers.29/mlp/down_proj/Linear", "/layers.29/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "sourceType": "ONNX", "bizCode": "MNNTest", "outputName": [ "logits", "presents" ] , "tensorNumber": 0, "extraInfo": { "version": "3.1.2" } , "preferForwardType": "CPU", "usage": "INFERENCE", "mnn_uuid": "7d09aa4a-7e0d-46ad-9f80-d7aeaa0d6269" }