{ "bizCode": "MNNTest", "extraInfo": { "version": "3.1.4" } , "oplists": [ { "main_type": "Input", "main": { "dims": [ 1, 1, 896 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "input_ids", "outputIndexes": [ 2 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, 1, -1, -1 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "attention_mask", "outputIndexes": [ 124 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1, -1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "position_ids", "outputIndexes": [ 34 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 24, 2, 1, -1, 2, 64 ] , "dtype": "DT_FLOAT", "dformat": "NCHW" } , "name": "past_key_values", "outputIndexes": [ 0 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "main_type": "Input", "main": { "dims": [ 1 ] , "dtype": "DT_INT32", "dformat": "NCHW" } , "name": "logits_index", "outputIndexes": [ 2182 ] , "type": "Input", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 0 ] , "main_type": "Reshape", "main": { "dims": [ -1 ] , "dimType": "NCHW" } , "name": "presents", "outputIndexes": [ 1 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 3 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1, -1, 896 ] } , "name": "/Constant_output_0", "outputIndexes": [ 3 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_output_0", "outputIndexes": [ 4 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 0, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm/Mul_1_output_0", "outputIndexes": [ 5 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 5 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2186 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2186 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2187 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 7168, 401430, 100352, 3584, 0 ] } , "name": "/layers.0/self_attn/q_proj/Linear", "outputIndexes": [ 2188 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2188 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2189 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2189 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 6 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 5 ] , "main_type": "NONE", "name": "/Shape_output_0", "outputIndexes": [ 7 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "Shape51", "outputIndexes": [ 8 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 7 ] , "main_type": "NONE", "name": "Rank53", "outputIndexes": [ 9 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 9, 9 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp55", "outputIndexes": [ 10 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze56", "outputIndexes": [ 11 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Const9", "outputIndexes": [ 12 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp58", "outputIndexes": [ 13 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 13 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze59", "outputIndexes": [ 14 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1 ] } , "name": "Unsqueeze61", "outputIndexes": [ 15 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 11, 14, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice62", "outputIndexes": [ 16 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 16 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze63", "outputIndexes": [ 17 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 17, 17 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp65", "outputIndexes": [ 18 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7, 18, 10 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_1_output_0", "outputIndexes": [ 19 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 0 ] } , "name": "/rotary/Constant_4_output_0", "outputIndexes": [ 20 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_output_0", "outputIndexes": [ 21 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 10 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze75", "outputIndexes": [ 22 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 13 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze78", "outputIndexes": [ 23 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 8, 22, 23, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice81", "outputIndexes": [ 24 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 24 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze82", "outputIndexes": [ 25 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 25 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp83", "outputIndexes": [ 26 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 26, 25 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp84", "outputIndexes": [ 27 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 7, 27, 10 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_2_output_0", "outputIndexes": [ 28 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_1_output_0", "outputIndexes": [ 29 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 14 ] } , "name": "/Constant_4_output_0", "outputIndexes": [ 30 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 64 ] } , "name": "/Constant_5_output_0", "outputIndexes": [ 31 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 21, 29, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_output_0", "outputIndexes": [ 32 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 6, 32 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_1_output_0", "outputIndexes": [ 33 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 34 ] , "main_type": "CastParam", "main": { "srcT": "DT_VARIANT", "dstT": "DT_FLOAT" } , "name": "/rotary/Cast_output_0", "outputIndexes": [ 35 ] , "type": "Cast", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 2 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ -1, 1 ] } , "name": "/rotary/Constant_1_output_0", "outputIndexes": [ 36 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 35, 36 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/rotary/Reshape_output_0", "outputIndexes": [ 37 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 32 ] , "dataFormat": "NCHW", "dataType": "DT_FLOAT", "float32s": [ 1.0, 0.649382, 0.421697, 0.273842, 0.177828, 0.115478, 0.074989, 0.048697, 0.031623, 0.020535, 0.013335, 0.00866, 0.005623, 0.003652, 0.002371, 0.00154, 0.001, 0.000649, 0.000422, 0.000274, 0.000178, 0.000115, 0.000075, 0.000049, 0.000032, 0.000021, 0.000013, 0.000009, 0.000006, 0.000004, 0.000002, 0.000002 ] } , "name": "/rotary/Constant_2_output_0", "outputIndexes": [ 38 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 37, 38 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/rotary/Mul_output_0", "outputIndexes": [ 39 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 39 ] , "main_type": "UnaryOp", "main": { "opType": "COS", "T": "DT_FLOAT" } , "name": "/rotary/Cos_output_0", "outputIndexes": [ 40 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 40, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_output_0", "outputIndexes": [ 41 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 39 ] , "main_type": "UnaryOp", "main": { "opType": "SIN", "T": "DT_FLOAT" } , "name": "/rotary/Sin_output_0", "outputIndexes": [ 42 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 42, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_1_output_0", "outputIndexes": [ 43 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 41, 43 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/rotary/Concat_output_0", "outputIndexes": [ 44 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 44, 44 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/rotary/Concat_1_output_0", "outputIndexes": [ 45 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_7_output_0", "outputIndexes": [ 46 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 45, 46 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_2_output_0", "outputIndexes": [ 47 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 47, 15 ] , "main_type": "SqueezeParam", "main": { } , "name": "/rotary/Unsqueeze_3_output_0", "outputIndexes": [ 48 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48 ] , "main_type": "NONE", "name": "Shape106", "outputIndexes": [ 49 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 48 ] , "main_type": "NONE", "name": "Rank108", "outputIndexes": [ 50 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 50, 50 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp110", "outputIndexes": [ 51 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 51 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze111", "outputIndexes": [ 52 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 51, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp113", "outputIndexes": [ 53 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze114", "outputIndexes": [ 54 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 52, 54, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice117", "outputIndexes": [ 55 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 55 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze118", "outputIndexes": [ 56 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 56, 56 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp120", "outputIndexes": [ 57 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 57, 51 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_3_output_0", "outputIndexes": [ 58 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_output_0", "outputIndexes": [ 59 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33 ] , "main_type": "NONE", "name": "/Shape_2_output_0", "outputIndexes": [ 60 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/Constant_10_output_0", "outputIndexes": [ 61 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60 ] , "main_type": "NONE", "name": "Shape238", "outputIndexes": [ 62 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 60 ] , "main_type": "NONE", "name": "Rank240", "outputIndexes": [ 63 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 63, 63 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp242", "outputIndexes": [ 64 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 64 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze243", "outputIndexes": [ 65 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 64, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp245", "outputIndexes": [ 66 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 66 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze246", "outputIndexes": [ 67 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 62, 65, 67, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice249", "outputIndexes": [ 68 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 68 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze250", "outputIndexes": [ 69 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 69 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp251", "outputIndexes": [ 70 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 70, 69 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp252", "outputIndexes": [ 71 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 60, 71, 64 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_5_output_0", "outputIndexes": [ 72 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 2 ] } , "name": "/rotary/Constant_6_output_0", "outputIndexes": [ 73 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 72, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_output_0", "outputIndexes": [ 74 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 74, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_7_output_0", "outputIndexes": [ 75 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 1073741824 ] } , "name": "/Constant_19_output_0", "outputIndexes": [ 76 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "main_type": "Blob", "main": { "dims": [ 1 ] , "dataFormat": "NCHW", "dataType": "DT_INT32", "int32s": [ 3 ] } , "name": "/Constant_13_output_0", "outputIndexes": [ 77 ] , "type": "Const", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33, 75, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_1_output_0", "outputIndexes": [ 78 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 78 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_output_0", "outputIndexes": [ 79 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 74, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_6_output_0", "outputIndexes": [ 80 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 33, 20, 80, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_output_0", "outputIndexes": [ 81 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 79, 81 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_3_output_0", "outputIndexes": [ 82 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 51 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze157", "outputIndexes": [ 83 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 53 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze160", "outputIndexes": [ 84 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 49, 83, 84, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice163", "outputIndexes": [ 85 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 85 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze164", "outputIndexes": [ 86 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 86 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp165", "outputIndexes": [ 87 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 87, 86 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp166", "outputIndexes": [ 88 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 48, 88, 51 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_4_output_0", "outputIndexes": [ 89 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 82, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_1_output_0", "outputIndexes": [ 90 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 59, 90 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_output_0", "outputIndexes": [ 91 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 512534, 57366, 14336, 512, 0 ] } , "name": "/layers.0/self_attn/k_proj/Linear", "outputIndexes": [ 2192 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2192 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2193 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2193 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 92 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_2_output_0", "outputIndexes": [ 93 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_3_output_0", "outputIndexes": [ 94 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 93, 94, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_1_output_0", "outputIndexes": [ 95 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 92, 95 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_2_output_0", "outputIndexes": [ 96 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_2_output_0", "outputIndexes": [ 97 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96 ] , "main_type": "NONE", "name": "/Shape_3_output_0", "outputIndexes": [ 98 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 98 ] , "main_type": "NONE", "name": "Shape125", "outputIndexes": [ 99 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 98 ] , "main_type": "NONE", "name": "Rank127", "outputIndexes": [ 100 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 100, 100 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp129", "outputIndexes": [ 101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze130", "outputIndexes": [ 102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 101, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp132", "outputIndexes": [ 103 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 103 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze133", "outputIndexes": [ 104 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 99, 102, 104, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice136", "outputIndexes": [ 105 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 105 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze137", "outputIndexes": [ 106 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 106 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp138", "outputIndexes": [ 107 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 107, 106 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp139", "outputIndexes": [ 108 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 98, 108, 101 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_6_output_0", "outputIndexes": [ 109 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 109, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_1_output_0", "outputIndexes": [ 110 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 110, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_9_output_0", "outputIndexes": [ 111 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 111, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_3_output_0", "outputIndexes": [ 112 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 112 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_1_output_0", "outputIndexes": [ 113 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 110, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_8_output_0", "outputIndexes": [ 114 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 96, 20, 114, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_2_output_0", "outputIndexes": [ 115 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 113, 115 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_4_output_0", "outputIndexes": [ 116 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 116, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_3_output_0", "outputIndexes": [ 117 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 97, 117 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_1_output_0", "outputIndexes": [ 118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2187 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 584748, 57366, 14336, 512, 0 ] } , "name": "/layers.0/self_attn/v_proj/Linear", "outputIndexes": [ 2196 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2196 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2197 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2197 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 119 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 19, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_4_output_0", "outputIndexes": [ 120 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 28, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_5_output_0", "outputIndexes": [ 121 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 120, 121, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_2_output_0", "outputIndexes": [ 122 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 119, 122 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_3_output_0", "outputIndexes": [ 123 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 91, 118, 123, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_8_output_0", "outputIndexes": [ 125 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 125 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2198 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2198 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2199 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2199 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 656962, 401430, 100352, 0, 0 ] } , "name": "/layers.0/self_attn/o_proj/Linear", "outputIndexes": [ 2200 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2200 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2201 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2201 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.0/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 126 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 4, 126 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_3_output_0", "outputIndexes": [ 127 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 127 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 1158744, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm/Mul_1_output_0", "outputIndexes": [ 128 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 128 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2202 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2202 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2203 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 1165912, 2179094, 544768, 0, 0 ] } , "name": "/layers.0/mlp/gate_proj/Linear", "outputIndexes": [ 2204 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2204 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2205 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2205 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 129 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 129 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn/Mul_output_0", "outputIndexes": [ 130 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2203 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 3889774, 2179094, 544768, 0, 0 ] } , "name": "/layers.0/mlp/up_proj/Linear", "outputIndexes": [ 2208 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2208 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2209 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2209 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 131 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 130, 131 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp/Mul_output_0", "outputIndexes": [ 132 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 132 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2210 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2210 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.0/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2211 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2211 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 6613636, 2179094, 544768, 0, 0 ] } , "name": "/layers.0/mlp/down_proj/Linear", "outputIndexes": [ 2212 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2212 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2213 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2213 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.0/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 133 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 127, 133 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_4_output_0", "outputIndexes": [ 134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 134, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_9_output_0", "outputIndexes": [ 135 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 9337498, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_1/Mul_1_output_0", "outputIndexes": [ 136 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2214 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2214 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2215 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9344666, 401430, 100352, 3584, 0 ] } , "name": "/layers.1/self_attn/q_proj/Linear", "outputIndexes": [ 2216 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2216 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2217 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2217 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 137 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 136 ] , "main_type": "NONE", "name": "/Shape_14_output_0", "outputIndexes": [ 138 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 138 ] , "main_type": "NONE", "name": "Shape483", "outputIndexes": [ 139 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 138 ] , "main_type": "NONE", "name": "Rank485", "outputIndexes": [ 140 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 140, 140 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp487", "outputIndexes": [ 141 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze488", "outputIndexes": [ 142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp490", "outputIndexes": [ 143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze491", "outputIndexes": [ 144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139, 142, 144, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice494", "outputIndexes": [ 145 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 145 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze495", "outputIndexes": [ 146 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 146, 146 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp497", "outputIndexes": [ 147 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138, 147, 141 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_18_output_0", "outputIndexes": [ 148 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_32_output_0", "outputIndexes": [ 149 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 141 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze505", "outputIndexes": [ 150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze508", "outputIndexes": [ 151 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 139, 150, 151, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice511", "outputIndexes": [ 152 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 152 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze512", "outputIndexes": [ 153 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 153 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp513", "outputIndexes": [ 154 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 154, 153 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp514", "outputIndexes": [ 155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 138, 155, 141 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_19_output_0", "outputIndexes": [ 156 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_33_output_0", "outputIndexes": [ 157 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 149, 157, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_13_output_0", "outputIndexes": [ 158 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 137, 158 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_10_output_0", "outputIndexes": [ 159 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_8_output_0", "outputIndexes": [ 160 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159 ] , "main_type": "NONE", "name": "/Shape_16_output_0", "outputIndexes": [ 161 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 161 ] , "main_type": "NONE", "name": "Shape614", "outputIndexes": [ 162 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 161 ] , "main_type": "NONE", "name": "Rank616", "outputIndexes": [ 163 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 163, 163 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp618", "outputIndexes": [ 164 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze619", "outputIndexes": [ 165 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 164, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp621", "outputIndexes": [ 166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 166 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze622", "outputIndexes": [ 167 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 162, 165, 167, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice625", "outputIndexes": [ 168 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 168 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze626", "outputIndexes": [ 169 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 169 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp627", "outputIndexes": [ 170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 170, 169 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp628", "outputIndexes": [ 171 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 161, 171, 164 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_20_output_0", "outputIndexes": [ 172 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 172, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_3_output_0", "outputIndexes": [ 173 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_39_output_0", "outputIndexes": [ 174 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159, 174, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_5_output_0", "outputIndexes": [ 175 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 175 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_2_output_0", "outputIndexes": [ 176 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 173, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_38_output_0", "outputIndexes": [ 177 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 159, 20, 177, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_4_output_0", "outputIndexes": [ 178 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 176, 178 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_16_output_0", "outputIndexes": [ 179 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 179, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_9_output_0", "outputIndexes": [ 180 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 160, 180 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_5_output_0", "outputIndexes": [ 181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9850032, 57366, 14336, 512, 0 ] } , "name": "/layers.1/self_attn/k_proj/Linear", "outputIndexes": [ 2220 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2220 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2221 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2221 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 182 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_34_output_0", "outputIndexes": [ 183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_35_output_0", "outputIndexes": [ 184 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 183, 184, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_14_output_0", "outputIndexes": [ 185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 182, 185 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_11_output_0", "outputIndexes": [ 186 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_10_output_0", "outputIndexes": [ 187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186 ] , "main_type": "NONE", "name": "/Shape_17_output_0", "outputIndexes": [ 188 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 188 ] , "main_type": "NONE", "name": "Shape521", "outputIndexes": [ 189 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 188 ] , "main_type": "NONE", "name": "Rank523", "outputIndexes": [ 190 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 190, 190 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp525", "outputIndexes": [ 191 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 191 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze526", "outputIndexes": [ 192 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 191, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp528", "outputIndexes": [ 193 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 193 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze529", "outputIndexes": [ 194 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 189, 192, 194, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice532", "outputIndexes": [ 195 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 195 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze533", "outputIndexes": [ 196 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 196 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp534", "outputIndexes": [ 197 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 197, 196 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp535", "outputIndexes": [ 198 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 188, 198, 191 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_21_output_0", "outputIndexes": [ 199 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 199, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_4_output_0", "outputIndexes": [ 200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 200, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_41_output_0", "outputIndexes": [ 201 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 201, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_7_output_0", "outputIndexes": [ 202 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 202 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_3_output_0", "outputIndexes": [ 203 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 200, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_40_output_0", "outputIndexes": [ 204 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 186, 20, 204, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_6_output_0", "outputIndexes": [ 205 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 203, 205 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_17_output_0", "outputIndexes": [ 206 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 206, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_11_output_0", "outputIndexes": [ 207 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 187, 207 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_6_output_0", "outputIndexes": [ 208 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2215 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9922246, 57366, 14336, 512, 0 ] } , "name": "/layers.1/self_attn/v_proj/Linear", "outputIndexes": [ 2224 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2224 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2225 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2225 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 209 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 148, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_36_output_0", "outputIndexes": [ 210 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 156, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_37_output_0", "outputIndexes": [ 211 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 210, 211, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_15_output_0", "outputIndexes": [ 212 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 209, 212 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_12_output_0", "outputIndexes": [ 213 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 181, 208, 213, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_17_output_0", "outputIndexes": [ 214 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 214 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2226 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2226 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2227 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2227 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 9994460, 401430, 100352, 0, 0 ] } , "name": "/layers.1/self_attn/o_proj/Linear", "outputIndexes": [ 2228 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2228 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2229 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2229 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.1/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 215 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 135, 215 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_8_output_0", "outputIndexes": [ 216 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 10496242, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_1/Mul_1_output_0", "outputIndexes": [ 217 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 217 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2230 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2230 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2231 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2231 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 10503410, 2179094, 544768, 0, 0 ] } , "name": "/layers.1/mlp/gate_proj/Linear", "outputIndexes": [ 2232 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2232 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2233 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2233 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 218 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 218 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_1/Mul_output_0", "outputIndexes": [ 219 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2231 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 13227272, 2179094, 544768, 0, 0 ] } , "name": "/layers.1/mlp/up_proj/Linear", "outputIndexes": [ 2236 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2236 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2237 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2237 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 220 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 219, 220 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_1/Mul_output_0", "outputIndexes": [ 221 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 221 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2238 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2238 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.1/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2239 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2239 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 15951134, 2179094, 544768, 0, 0 ] } , "name": "/layers.1/mlp/down_proj/Linear", "outputIndexes": [ 2240 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2240 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2241 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2241 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.1/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 222 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 216, 222 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_9_output_0", "outputIndexes": [ 223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 223, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_18_output_0", "outputIndexes": [ 224 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 18674996, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_2/Mul_1_output_0", "outputIndexes": [ 225 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2242 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2242 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2243 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2243 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 18682164, 401430, 100352, 3584, 0 ] } , "name": "/layers.2/self_attn/q_proj/Linear", "outputIndexes": [ 2244 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2244 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2245 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2245 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 226 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 225 ] , "main_type": "NONE", "name": "/Shape_28_output_0", "outputIndexes": [ 227 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 227 ] , "main_type": "NONE", "name": "Shape853", "outputIndexes": [ 228 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 227 ] , "main_type": "NONE", "name": "Rank855", "outputIndexes": [ 229 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 229, 229 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp857", "outputIndexes": [ 230 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze858", "outputIndexes": [ 231 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp860", "outputIndexes": [ 232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze861", "outputIndexes": [ 233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 231, 233, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice864", "outputIndexes": [ 234 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 234 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze865", "outputIndexes": [ 235 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 235, 235 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp867", "outputIndexes": [ 236 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227, 236, 230 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_33_output_0", "outputIndexes": [ 237 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_64_output_0", "outputIndexes": [ 238 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 230 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze875", "outputIndexes": [ 239 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze878", "outputIndexes": [ 240 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 228, 239, 240, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice881", "outputIndexes": [ 241 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 241 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze882", "outputIndexes": [ 242 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 242 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp883", "outputIndexes": [ 243 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 243, 242 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp884", "outputIndexes": [ 244 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 227, 244, 230 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_34_output_0", "outputIndexes": [ 245 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_65_output_0", "outputIndexes": [ 246 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 238, 246, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_26_output_0", "outputIndexes": [ 247 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 226, 247 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_19_output_0", "outputIndexes": [ 248 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_16_output_0", "outputIndexes": [ 249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248 ] , "main_type": "NONE", "name": "/Shape_30_output_0", "outputIndexes": [ 250 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 250 ] , "main_type": "NONE", "name": "Shape984", "outputIndexes": [ 251 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 250 ] , "main_type": "NONE", "name": "Rank986", "outputIndexes": [ 252 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 252, 252 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp988", "outputIndexes": [ 253 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze989", "outputIndexes": [ 254 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 253, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp991", "outputIndexes": [ 255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 255 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze992", "outputIndexes": [ 256 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 251, 254, 256, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice995", "outputIndexes": [ 257 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 257 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze996", "outputIndexes": [ 258 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 258 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp997", "outputIndexes": [ 259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 259, 258 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp998", "outputIndexes": [ 260 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 250, 260, 253 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_35_output_0", "outputIndexes": [ 261 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 261, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_6_output_0", "outputIndexes": [ 262 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_71_output_0", "outputIndexes": [ 263 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 263, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_9_output_0", "outputIndexes": [ 264 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 264 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_4_output_0", "outputIndexes": [ 265 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 262, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_70_output_0", "outputIndexes": [ 266 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 248, 20, 266, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_8_output_0", "outputIndexes": [ 267 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 265, 267 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_29_output_0", "outputIndexes": [ 268 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 268, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_17_output_0", "outputIndexes": [ 269 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 249, 269 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_10_output_0", "outputIndexes": [ 270 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2243 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 19187530, 57366, 14336, 512, 0 ] } , "name": "/layers.2/self_attn/k_proj/Linear", "outputIndexes": [ 2248 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2248 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2249 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2249 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 271 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_66_output_0", "outputIndexes": [ 272 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_67_output_0", "outputIndexes": [ 273 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 272, 273, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_27_output_0", "outputIndexes": [ 274 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 271, 274 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_20_output_0", "outputIndexes": [ 275 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_18_output_0", "outputIndexes": [ 276 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275 ] , "main_type": "NONE", "name": "/Shape_31_output_0", "outputIndexes": [ 277 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 277 ] , "main_type": "NONE", "name": "Shape891", "outputIndexes": [ 278 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 277 ] , "main_type": "NONE", "name": "Rank893", "outputIndexes": [ 279 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 279, 279 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp895", "outputIndexes": [ 280 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 280 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze896", "outputIndexes": [ 281 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 280, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp898", "outputIndexes": [ 282 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 282 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze899", "outputIndexes": [ 283 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 278, 281, 283, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice902", "outputIndexes": [ 284 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 284 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze903", "outputIndexes": [ 285 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 285 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp904", "outputIndexes": [ 286 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 286, 285 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp905", "outputIndexes": [ 287 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 277, 287, 280 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_36_output_0", "outputIndexes": [ 288 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 288, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_7_output_0", "outputIndexes": [ 289 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_73_output_0", "outputIndexes": [ 290 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 290, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_11_output_0", "outputIndexes": [ 291 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 291 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_5_output_0", "outputIndexes": [ 292 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 289, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_72_output_0", "outputIndexes": [ 293 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 275, 20, 293, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_10_output_0", "outputIndexes": [ 294 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 292, 294 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_30_output_0", "outputIndexes": [ 295 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 295, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_19_output_0", "outputIndexes": [ 296 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 276, 296 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_11_output_0", "outputIndexes": [ 297 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2243 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 19259744, 57366, 14336, 512, 0 ] } , "name": "/layers.2/self_attn/v_proj/Linear", "outputIndexes": [ 2252 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2252 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2253 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2253 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 298 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 237, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_68_output_0", "outputIndexes": [ 299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 245, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_69_output_0", "outputIndexes": [ 300 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 299, 300, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_28_output_0", "outputIndexes": [ 301 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 298, 301 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_21_output_0", "outputIndexes": [ 302 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 270, 297, 302, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_26_output_0", "outputIndexes": [ 303 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 303 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2254 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2254 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2255 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2255 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 19331958, 401430, 100352, 0, 0 ] } , "name": "/layers.2/self_attn/o_proj/Linear", "outputIndexes": [ 2256 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2256 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2257 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2257 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.2/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 304 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 224, 304 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_13_output_0", "outputIndexes": [ 305 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 305 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 19833740, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_2/Mul_1_output_0", "outputIndexes": [ 306 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 306 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2258 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2258 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2259 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2259 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 19840908, 2179094, 544768, 0, 0 ] } , "name": "/layers.2/mlp/gate_proj/Linear", "outputIndexes": [ 2260 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2260 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2261 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2261 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 307 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 307 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_2/Mul_output_0", "outputIndexes": [ 308 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2259 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 22564770, 2179094, 544768, 0, 0 ] } , "name": "/layers.2/mlp/up_proj/Linear", "outputIndexes": [ 2264 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2264 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2265 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2265 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 309 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 308, 309 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_2/Mul_output_0", "outputIndexes": [ 310 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 310 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2266 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2266 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.2/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2267 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2267 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 25288632, 2179094, 544768, 0, 0 ] } , "name": "/layers.2/mlp/down_proj/Linear", "outputIndexes": [ 2268 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2268 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2269 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2269 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.2/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 311 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 305, 311 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_14_output_0", "outputIndexes": [ 312 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 312, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_27_output_0", "outputIndexes": [ 313 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 313 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 28012494, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_3/Mul_1_output_0", "outputIndexes": [ 314 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2270 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2270 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2271 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28019662, 401430, 100352, 3584, 0 ] } , "name": "/layers.3/self_attn/q_proj/Linear", "outputIndexes": [ 2272 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2272 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2273 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2273 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 315 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 314 ] , "main_type": "NONE", "name": "/Shape_42_output_0", "outputIndexes": [ 316 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 316 ] , "main_type": "NONE", "name": "Shape1223", "outputIndexes": [ 317 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 316 ] , "main_type": "NONE", "name": "Rank1225", "outputIndexes": [ 318 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 318, 318 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1227", "outputIndexes": [ 319 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1228", "outputIndexes": [ 320 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1230", "outputIndexes": [ 321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1231", "outputIndexes": [ 322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 320, 322, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1234", "outputIndexes": [ 323 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 323 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1235", "outputIndexes": [ 324 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 324, 324 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1237", "outputIndexes": [ 325 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316, 325, 319 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_48_output_0", "outputIndexes": [ 326 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_96_output_0", "outputIndexes": [ 327 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 319 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1245", "outputIndexes": [ 328 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1248", "outputIndexes": [ 329 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 317, 328, 329, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1251", "outputIndexes": [ 330 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 330 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1252", "outputIndexes": [ 331 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 331 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1253", "outputIndexes": [ 332 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 332, 331 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1254", "outputIndexes": [ 333 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 316, 333, 319 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_49_output_0", "outputIndexes": [ 334 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_97_output_0", "outputIndexes": [ 335 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 327, 335, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_39_output_0", "outputIndexes": [ 336 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 315, 336 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_28_output_0", "outputIndexes": [ 337 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_24_output_0", "outputIndexes": [ 338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337 ] , "main_type": "NONE", "name": "/Shape_44_output_0", "outputIndexes": [ 339 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 339 ] , "main_type": "NONE", "name": "Shape1355", "outputIndexes": [ 340 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 339 ] , "main_type": "NONE", "name": "Rank1357", "outputIndexes": [ 341 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 341, 341 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1359", "outputIndexes": [ 342 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1360", "outputIndexes": [ 343 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 342, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1362", "outputIndexes": [ 344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 344 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1363", "outputIndexes": [ 345 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 340, 343, 345, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1366", "outputIndexes": [ 346 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 346 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1367", "outputIndexes": [ 347 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 347 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1368", "outputIndexes": [ 348 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 348, 347 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1369", "outputIndexes": [ 349 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 339, 349, 342 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_50_output_0", "outputIndexes": [ 350 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 350, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_9_output_0", "outputIndexes": [ 351 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_103_output_0", "outputIndexes": [ 352 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 352, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_13_output_0", "outputIndexes": [ 353 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 353 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_6_output_0", "outputIndexes": [ 354 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 351, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_102_output_0", "outputIndexes": [ 355 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 337, 20, 355, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_12_output_0", "outputIndexes": [ 356 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 354, 356 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_42_output_0", "outputIndexes": [ 357 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 357, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_25_output_0", "outputIndexes": [ 358 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 338, 358 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_15_output_0", "outputIndexes": [ 359 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28525028, 57366, 14336, 512, 0 ] } , "name": "/layers.3/self_attn/k_proj/Linear", "outputIndexes": [ 2276 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2276 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2277 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2277 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 360 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_98_output_0", "outputIndexes": [ 361 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_99_output_0", "outputIndexes": [ 362 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 361, 362, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_40_output_0", "outputIndexes": [ 363 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 360, 363 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_29_output_0", "outputIndexes": [ 364 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_26_output_0", "outputIndexes": [ 365 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364 ] , "main_type": "NONE", "name": "/Shape_45_output_0", "outputIndexes": [ 366 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 366 ] , "main_type": "NONE", "name": "Shape1261", "outputIndexes": [ 367 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 366 ] , "main_type": "NONE", "name": "Rank1263", "outputIndexes": [ 368 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 368, 368 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1265", "outputIndexes": [ 369 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1266", "outputIndexes": [ 370 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 369, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1268", "outputIndexes": [ 371 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 371 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1269", "outputIndexes": [ 372 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 367, 370, 372, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1272", "outputIndexes": [ 373 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 373 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1273", "outputIndexes": [ 374 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 374 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1274", "outputIndexes": [ 375 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 375, 374 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1275", "outputIndexes": [ 376 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 366, 376, 369 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_51_output_0", "outputIndexes": [ 377 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 377, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_10_output_0", "outputIndexes": [ 378 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 378, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_105_output_0", "outputIndexes": [ 379 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 379, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_15_output_0", "outputIndexes": [ 380 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 380 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_7_output_0", "outputIndexes": [ 381 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 378, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_104_output_0", "outputIndexes": [ 382 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 364, 20, 382, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_14_output_0", "outputIndexes": [ 383 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 381, 383 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_43_output_0", "outputIndexes": [ 384 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 384, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_27_output_0", "outputIndexes": [ 385 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 365, 385 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_16_output_0", "outputIndexes": [ 386 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2271 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28597242, 57366, 14336, 512, 0 ] } , "name": "/layers.3/self_attn/v_proj/Linear", "outputIndexes": [ 2280 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2280 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2281 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2281 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 387 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 326, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_100_output_0", "outputIndexes": [ 388 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 334, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_101_output_0", "outputIndexes": [ 389 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 388, 389, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_41_output_0", "outputIndexes": [ 390 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 387, 390 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_30_output_0", "outputIndexes": [ 391 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 359, 386, 391, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_35_output_0", "outputIndexes": [ 392 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 392 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2282 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2282 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2283 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2283 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 28669456, 401430, 100352, 0, 0 ] } , "name": "/layers.3/self_attn/o_proj/Linear", "outputIndexes": [ 2284 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2284 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2285 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2285 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.3/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 393 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 313, 393 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_18_output_0", "outputIndexes": [ 394 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 29171238, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_3/Mul_1_output_0", "outputIndexes": [ 395 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 395 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2286 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2286 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2287 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2287 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 29178406, 2179094, 544768, 0, 0 ] } , "name": "/layers.3/mlp/gate_proj/Linear", "outputIndexes": [ 2288 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2288 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2289 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2289 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 396 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 396 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_3/Mul_output_0", "outputIndexes": [ 397 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2287 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 31902268, 2179094, 544768, 0, 0 ] } , "name": "/layers.3/mlp/up_proj/Linear", "outputIndexes": [ 2292 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2292 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2293 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2293 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 398 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 397, 398 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_3/Mul_output_0", "outputIndexes": [ 399 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 399 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2294 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2294 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.3/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2295 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2295 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 34626130, 2179094, 544768, 0, 0 ] } , "name": "/layers.3/mlp/down_proj/Linear", "outputIndexes": [ 2296 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2296 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2297 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2297 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.3/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 400 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 394, 400 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_19_output_0", "outputIndexes": [ 401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 401, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_36_output_0", "outputIndexes": [ 402 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 402 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 37349992, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_4/Mul_1_output_0", "outputIndexes": [ 403 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2298 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2298 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2299 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 37357160, 401430, 100352, 3584, 0 ] } , "name": "/layers.4/self_attn/q_proj/Linear", "outputIndexes": [ 2300 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2300 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2301 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2301 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 404 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 403 ] , "main_type": "NONE", "name": "/Shape_56_output_0", "outputIndexes": [ 405 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 405 ] , "main_type": "NONE", "name": "Shape1594", "outputIndexes": [ 406 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 405 ] , "main_type": "NONE", "name": "Rank1596", "outputIndexes": [ 407 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 407, 407 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1598", "outputIndexes": [ 408 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1599", "outputIndexes": [ 409 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1601", "outputIndexes": [ 410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1602", "outputIndexes": [ 411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 406, 409, 411, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1605", "outputIndexes": [ 412 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 412 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1606", "outputIndexes": [ 413 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 413, 413 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1608", "outputIndexes": [ 414 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 414, 408 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_63_output_0", "outputIndexes": [ 415 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_128_output_0", "outputIndexes": [ 416 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 408 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1616", "outputIndexes": [ 417 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1619", "outputIndexes": [ 418 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 406, 417, 418, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1622", "outputIndexes": [ 419 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 419 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1623", "outputIndexes": [ 420 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 420 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1624", "outputIndexes": [ 421 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 421, 420 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1625", "outputIndexes": [ 422 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 405, 422, 408 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_64_output_0", "outputIndexes": [ 423 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_129_output_0", "outputIndexes": [ 424 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 416, 424, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_52_output_0", "outputIndexes": [ 425 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 404, 425 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_37_output_0", "outputIndexes": [ 426 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_32_output_0", "outputIndexes": [ 427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426 ] , "main_type": "NONE", "name": "/Shape_58_output_0", "outputIndexes": [ 428 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 428 ] , "main_type": "NONE", "name": "Shape1726", "outputIndexes": [ 429 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 428 ] , "main_type": "NONE", "name": "Rank1728", "outputIndexes": [ 430 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 430, 430 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1730", "outputIndexes": [ 431 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1731", "outputIndexes": [ 432 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 431, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1733", "outputIndexes": [ 433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 433 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1734", "outputIndexes": [ 434 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 429, 432, 434, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1737", "outputIndexes": [ 435 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 435 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1738", "outputIndexes": [ 436 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 436 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1739", "outputIndexes": [ 437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 437, 436 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1740", "outputIndexes": [ 438 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 428, 438, 431 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_65_output_0", "outputIndexes": [ 439 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 439, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_12_output_0", "outputIndexes": [ 440 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 440, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_135_output_0", "outputIndexes": [ 441 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 441, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_17_output_0", "outputIndexes": [ 442 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 442 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_8_output_0", "outputIndexes": [ 443 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 440, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_134_output_0", "outputIndexes": [ 444 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 426, 20, 444, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_16_output_0", "outputIndexes": [ 445 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 443, 445 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_55_output_0", "outputIndexes": [ 446 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 446, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_33_output_0", "outputIndexes": [ 447 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 427, 447 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_20_output_0", "outputIndexes": [ 448 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 37862526, 57366, 14336, 512, 0 ] } , "name": "/layers.4/self_attn/k_proj/Linear", "outputIndexes": [ 2304 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2304 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2305 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2305 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 449 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_130_output_0", "outputIndexes": [ 450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_131_output_0", "outputIndexes": [ 451 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 450, 451, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_53_output_0", "outputIndexes": [ 452 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 449, 452 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_38_output_0", "outputIndexes": [ 453 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_34_output_0", "outputIndexes": [ 454 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453 ] , "main_type": "NONE", "name": "/Shape_59_output_0", "outputIndexes": [ 455 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 455 ] , "main_type": "NONE", "name": "Shape1632", "outputIndexes": [ 456 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 455 ] , "main_type": "NONE", "name": "Rank1634", "outputIndexes": [ 457 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 457, 457 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1636", "outputIndexes": [ 458 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1637", "outputIndexes": [ 459 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 458, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1639", "outputIndexes": [ 460 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 460 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1640", "outputIndexes": [ 461 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 456, 459, 461, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1643", "outputIndexes": [ 462 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 462 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1644", "outputIndexes": [ 463 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 463 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1645", "outputIndexes": [ 464 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 464, 463 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1646", "outputIndexes": [ 465 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 455, 465, 458 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_66_output_0", "outputIndexes": [ 466 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 466, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_13_output_0", "outputIndexes": [ 467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_137_output_0", "outputIndexes": [ 468 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 468, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_19_output_0", "outputIndexes": [ 469 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 469 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_9_output_0", "outputIndexes": [ 470 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 467, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_136_output_0", "outputIndexes": [ 471 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 453, 20, 471, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_18_output_0", "outputIndexes": [ 472 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 470, 472 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_56_output_0", "outputIndexes": [ 473 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 473, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_35_output_0", "outputIndexes": [ 474 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 454, 474 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_21_output_0", "outputIndexes": [ 475 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2299 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 37934740, 57366, 14336, 512, 0 ] } , "name": "/layers.4/self_attn/v_proj/Linear", "outputIndexes": [ 2308 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2308 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2309 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2309 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 476 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 415, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_132_output_0", "outputIndexes": [ 477 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 423, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_133_output_0", "outputIndexes": [ 478 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 477, 478, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_54_output_0", "outputIndexes": [ 479 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 476, 479 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_39_output_0", "outputIndexes": [ 480 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 448, 475, 480, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_44_output_0", "outputIndexes": [ 481 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 481 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2310 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2310 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2311 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2311 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 38006954, 401430, 100352, 0, 0 ] } , "name": "/layers.4/self_attn/o_proj/Linear", "outputIndexes": [ 2312 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2312 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2313 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2313 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.4/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 482 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 402, 482 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_23_output_0", "outputIndexes": [ 483 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 38508736, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_4/Mul_1_output_0", "outputIndexes": [ 484 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 484 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2314 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2314 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2315 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2315 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 38515904, 2179094, 544768, 0, 0 ] } , "name": "/layers.4/mlp/gate_proj/Linear", "outputIndexes": [ 2316 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2316 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2317 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2317 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 485 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 485 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_4/Mul_output_0", "outputIndexes": [ 486 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2315 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 41239766, 2179094, 544768, 0, 0 ] } , "name": "/layers.4/mlp/up_proj/Linear", "outputIndexes": [ 2320 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2320 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2321 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2321 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 487 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 486, 487 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_4/Mul_output_0", "outputIndexes": [ 488 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 488 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2322 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2322 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.4/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2323 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2323 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 43963628, 2179094, 544768, 0, 0 ] } , "name": "/layers.4/mlp/down_proj/Linear", "outputIndexes": [ 2324 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2324 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2325 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2325 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.4/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 489 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 483, 489 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_24_output_0", "outputIndexes": [ 490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 490, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_45_output_0", "outputIndexes": [ 491 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 491 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 46687490, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_5/Mul_1_output_0", "outputIndexes": [ 492 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 492 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2326 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2326 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2327 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 46694658, 401430, 100352, 3584, 0 ] } , "name": "/layers.5/self_attn/q_proj/Linear", "outputIndexes": [ 2328 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2328 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2329 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2329 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 493 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 492 ] , "main_type": "NONE", "name": "/Shape_70_output_0", "outputIndexes": [ 494 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 494 ] , "main_type": "NONE", "name": "Shape1965", "outputIndexes": [ 495 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 494 ] , "main_type": "NONE", "name": "Rank1967", "outputIndexes": [ 496 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 496, 496 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1969", "outputIndexes": [ 497 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1970", "outputIndexes": [ 498 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1972", "outputIndexes": [ 499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1973", "outputIndexes": [ 500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 495, 498, 500, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1976", "outputIndexes": [ 501 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 501 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1977", "outputIndexes": [ 502 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 502, 502 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1979", "outputIndexes": [ 503 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494, 503, 497 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_78_output_0", "outputIndexes": [ 504 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_160_output_0", "outputIndexes": [ 505 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 497 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1987", "outputIndexes": [ 506 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze1990", "outputIndexes": [ 507 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 495, 506, 507, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice1993", "outputIndexes": [ 508 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 508 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze1994", "outputIndexes": [ 509 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 509 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1995", "outputIndexes": [ 510 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 510, 509 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp1996", "outputIndexes": [ 511 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 494, 511, 497 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_79_output_0", "outputIndexes": [ 512 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_161_output_0", "outputIndexes": [ 513 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 505, 513, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_65_output_0", "outputIndexes": [ 514 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 493, 514 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_46_output_0", "outputIndexes": [ 515 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_40_output_0", "outputIndexes": [ 516 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515 ] , "main_type": "NONE", "name": "/Shape_72_output_0", "outputIndexes": [ 517 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 517 ] , "main_type": "NONE", "name": "Shape2097", "outputIndexes": [ 518 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 517 ] , "main_type": "NONE", "name": "Rank2099", "outputIndexes": [ 519 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 519, 519 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2101", "outputIndexes": [ 520 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 520 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2102", "outputIndexes": [ 521 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 520, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2104", "outputIndexes": [ 522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 522 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2105", "outputIndexes": [ 523 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 518, 521, 523, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2108", "outputIndexes": [ 524 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 524 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2109", "outputIndexes": [ 525 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 525 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2110", "outputIndexes": [ 526 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 526, 525 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2111", "outputIndexes": [ 527 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 517, 527, 520 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_80_output_0", "outputIndexes": [ 528 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 528, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_15_output_0", "outputIndexes": [ 529 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_167_output_0", "outputIndexes": [ 530 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 530, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_21_output_0", "outputIndexes": [ 531 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 531 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_10_output_0", "outputIndexes": [ 532 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 529, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_166_output_0", "outputIndexes": [ 533 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 515, 20, 533, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_20_output_0", "outputIndexes": [ 534 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 532, 534 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_68_output_0", "outputIndexes": [ 535 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 535, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_41_output_0", "outputIndexes": [ 536 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 516, 536 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_25_output_0", "outputIndexes": [ 537 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47200024, 57366, 14336, 512, 0 ] } , "name": "/layers.5/self_attn/k_proj/Linear", "outputIndexes": [ 2332 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2332 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2333 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2333 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 538 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_162_output_0", "outputIndexes": [ 539 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_163_output_0", "outputIndexes": [ 540 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 539, 540, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_66_output_0", "outputIndexes": [ 541 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 538, 541 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_47_output_0", "outputIndexes": [ 542 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_42_output_0", "outputIndexes": [ 543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542 ] , "main_type": "NONE", "name": "/Shape_73_output_0", "outputIndexes": [ 544 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 544 ] , "main_type": "NONE", "name": "Shape2003", "outputIndexes": [ 545 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 544 ] , "main_type": "NONE", "name": "Rank2005", "outputIndexes": [ 546 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 546, 546 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2007", "outputIndexes": [ 547 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 547 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2008", "outputIndexes": [ 548 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 547, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2010", "outputIndexes": [ 549 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 549 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2011", "outputIndexes": [ 550 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 545, 548, 550, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2014", "outputIndexes": [ 551 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 551 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2015", "outputIndexes": [ 552 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 552 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2016", "outputIndexes": [ 553 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 553, 552 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2017", "outputIndexes": [ 554 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 544, 554, 547 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_81_output_0", "outputIndexes": [ 555 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 555, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_16_output_0", "outputIndexes": [ 556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 556, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_169_output_0", "outputIndexes": [ 557 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 557, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_23_output_0", "outputIndexes": [ 558 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 558 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_11_output_0", "outputIndexes": [ 559 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 556, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_168_output_0", "outputIndexes": [ 560 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 542, 20, 560, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_22_output_0", "outputIndexes": [ 561 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 559, 561 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_69_output_0", "outputIndexes": [ 562 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 562, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_43_output_0", "outputIndexes": [ 563 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 543, 563 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_26_output_0", "outputIndexes": [ 564 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2327 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47272238, 57366, 14336, 512, 0 ] } , "name": "/layers.5/self_attn/v_proj/Linear", "outputIndexes": [ 2336 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2336 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2337 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2337 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 565 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 504, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_164_output_0", "outputIndexes": [ 566 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 512, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_165_output_0", "outputIndexes": [ 567 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 566, 567, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_67_output_0", "outputIndexes": [ 568 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 565, 568 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_48_output_0", "outputIndexes": [ 569 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 537, 564, 569, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_53_output_0", "outputIndexes": [ 570 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 570 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2338 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2338 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2339 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2339 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47344452, 401430, 100352, 0, 0 ] } , "name": "/layers.5/self_attn/o_proj/Linear", "outputIndexes": [ 2340 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2340 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2341 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2341 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.5/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 571 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 491, 571 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_28_output_0", "outputIndexes": [ 572 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 47846234, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_5/Mul_1_output_0", "outputIndexes": [ 573 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 573 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2342 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2342 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2343 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2343 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 47853402, 2179094, 544768, 0, 0 ] } , "name": "/layers.5/mlp/gate_proj/Linear", "outputIndexes": [ 2344 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2344 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2345 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2345 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 574 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 574 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_5/Mul_output_0", "outputIndexes": [ 575 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2343 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 50577264, 2179094, 544768, 0, 0 ] } , "name": "/layers.5/mlp/up_proj/Linear", "outputIndexes": [ 2348 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2348 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2349 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2349 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 576 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 575, 576 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_5/Mul_output_0", "outputIndexes": [ 577 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 577 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2350 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2350 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.5/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2351 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2351 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 53301126, 2179094, 544768, 0, 0 ] } , "name": "/layers.5/mlp/down_proj/Linear", "outputIndexes": [ 2352 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2352 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2353 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2353 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.5/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 578 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 572, 578 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_29_output_0", "outputIndexes": [ 579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 579, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_54_output_0", "outputIndexes": [ 580 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 56024988, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_6/Mul_1_output_0", "outputIndexes": [ 581 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2354 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2354 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2355 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2355 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56032156, 401430, 100352, 3584, 0 ] } , "name": "/layers.6/self_attn/q_proj/Linear", "outputIndexes": [ 2356 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2356 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2357 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2357 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 582 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 581 ] , "main_type": "NONE", "name": "/Shape_84_output_0", "outputIndexes": [ 583 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 583 ] , "main_type": "NONE", "name": "Shape2336", "outputIndexes": [ 584 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 583 ] , "main_type": "NONE", "name": "Rank2338", "outputIndexes": [ 585 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 585, 585 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2340", "outputIndexes": [ 586 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2341", "outputIndexes": [ 587 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2343", "outputIndexes": [ 588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2344", "outputIndexes": [ 589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584, 587, 589, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2347", "outputIndexes": [ 590 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 590 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2348", "outputIndexes": [ 591 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 591, 591 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2350", "outputIndexes": [ 592 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 592, 586 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_93_output_0", "outputIndexes": [ 593 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_192_output_0", "outputIndexes": [ 594 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 586 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2358", "outputIndexes": [ 595 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2361", "outputIndexes": [ 596 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 584, 595, 596, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2364", "outputIndexes": [ 597 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 597 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2365", "outputIndexes": [ 598 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 598 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2366", "outputIndexes": [ 599 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 599, 598 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2367", "outputIndexes": [ 600 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 583, 600, 586 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_94_output_0", "outputIndexes": [ 601 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_193_output_0", "outputIndexes": [ 602 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 594, 602, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_78_output_0", "outputIndexes": [ 603 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 582, 603 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_55_output_0", "outputIndexes": [ 604 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_48_output_0", "outputIndexes": [ 605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604 ] , "main_type": "NONE", "name": "/Shape_86_output_0", "outputIndexes": [ 606 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 606 ] , "main_type": "NONE", "name": "Shape2467", "outputIndexes": [ 607 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 606 ] , "main_type": "NONE", "name": "Rank2469", "outputIndexes": [ 608 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 608, 608 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2471", "outputIndexes": [ 609 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2472", "outputIndexes": [ 610 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 609, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2474", "outputIndexes": [ 611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 611 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2475", "outputIndexes": [ 612 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 607, 610, 612, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2478", "outputIndexes": [ 613 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 613 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2479", "outputIndexes": [ 614 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 614 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2480", "outputIndexes": [ 615 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 615, 614 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2481", "outputIndexes": [ 616 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 606, 616, 609 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_95_output_0", "outputIndexes": [ 617 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 617, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_18_output_0", "outputIndexes": [ 618 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 618, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_199_output_0", "outputIndexes": [ 619 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 619, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_25_output_0", "outputIndexes": [ 620 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 620 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_12_output_0", "outputIndexes": [ 621 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 618, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_198_output_0", "outputIndexes": [ 622 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 604, 20, 622, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_24_output_0", "outputIndexes": [ 623 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 621, 623 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_81_output_0", "outputIndexes": [ 624 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 624, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_49_output_0", "outputIndexes": [ 625 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 605, 625 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_30_output_0", "outputIndexes": [ 626 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2355 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56537522, 57366, 14336, 512, 0 ] } , "name": "/layers.6/self_attn/k_proj/Linear", "outputIndexes": [ 2360 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2360 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2361 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2361 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 627 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_194_output_0", "outputIndexes": [ 628 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_195_output_0", "outputIndexes": [ 629 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 628, 629, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_79_output_0", "outputIndexes": [ 630 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 627, 630 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_56_output_0", "outputIndexes": [ 631 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_50_output_0", "outputIndexes": [ 632 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631 ] , "main_type": "NONE", "name": "/Shape_87_output_0", "outputIndexes": [ 633 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 633 ] , "main_type": "NONE", "name": "Shape2374", "outputIndexes": [ 634 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 633 ] , "main_type": "NONE", "name": "Rank2376", "outputIndexes": [ 635 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 635, 635 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2378", "outputIndexes": [ 636 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2379", "outputIndexes": [ 637 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 636, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2381", "outputIndexes": [ 638 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 638 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2382", "outputIndexes": [ 639 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 634, 637, 639, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2385", "outputIndexes": [ 640 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 640 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2386", "outputIndexes": [ 641 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 641 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2387", "outputIndexes": [ 642 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 642, 641 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2388", "outputIndexes": [ 643 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 633, 643, 636 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_96_output_0", "outputIndexes": [ 644 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 644, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_19_output_0", "outputIndexes": [ 645 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 645, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_201_output_0", "outputIndexes": [ 646 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 646, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_27_output_0", "outputIndexes": [ 647 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 647 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_13_output_0", "outputIndexes": [ 648 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 645, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_200_output_0", "outputIndexes": [ 649 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 631, 20, 649, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_26_output_0", "outputIndexes": [ 650 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 648, 650 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_82_output_0", "outputIndexes": [ 651 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 651, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_51_output_0", "outputIndexes": [ 652 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 632, 652 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_31_output_0", "outputIndexes": [ 653 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2355 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56609736, 57366, 14336, 512, 0 ] } , "name": "/layers.6/self_attn/v_proj/Linear", "outputIndexes": [ 2364 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2364 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2365 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2365 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 654 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 593, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_196_output_0", "outputIndexes": [ 655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 601, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_197_output_0", "outputIndexes": [ 656 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 655, 656, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_80_output_0", "outputIndexes": [ 657 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 654, 657 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_57_output_0", "outputIndexes": [ 658 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 626, 653, 658, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_62_output_0", "outputIndexes": [ 659 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 659 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2366 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2366 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2367 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2367 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 56681950, 401430, 100352, 0, 0 ] } , "name": "/layers.6/self_attn/o_proj/Linear", "outputIndexes": [ 2368 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2368 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2369 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2369 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.6/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 660 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 580, 660 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_33_output_0", "outputIndexes": [ 661 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 661 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 57183732, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_6/Mul_1_output_0", "outputIndexes": [ 662 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 662 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2370 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2370 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2371 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2371 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 57190900, 2179094, 544768, 0, 0 ] } , "name": "/layers.6/mlp/gate_proj/Linear", "outputIndexes": [ 2372 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2372 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2373 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2373 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 663 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 663 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_6/Mul_output_0", "outputIndexes": [ 664 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2371 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 59914762, 2179094, 544768, 0, 0 ] } , "name": "/layers.6/mlp/up_proj/Linear", "outputIndexes": [ 2376 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2376 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2377 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2377 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 665 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 664, 665 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_6/Mul_output_0", "outputIndexes": [ 666 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 666 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2378 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2378 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.6/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2379 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2379 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 62638624, 2179094, 544768, 0, 0 ] } , "name": "/layers.6/mlp/down_proj/Linear", "outputIndexes": [ 2380 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2380 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2381 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2381 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.6/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 667 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 661, 667 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_34_output_0", "outputIndexes": [ 668 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 668, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_63_output_0", "outputIndexes": [ 669 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 65362486, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_7/Mul_1_output_0", "outputIndexes": [ 670 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2382 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2382 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2383 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 65369654, 401430, 100352, 3584, 0 ] } , "name": "/layers.7/self_attn/q_proj/Linear", "outputIndexes": [ 2384 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2384 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2385 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2385 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 671 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 670 ] , "main_type": "NONE", "name": "/Shape_98_output_0", "outputIndexes": [ 672 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 672 ] , "main_type": "NONE", "name": "Shape2706", "outputIndexes": [ 673 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 672 ] , "main_type": "NONE", "name": "Rank2708", "outputIndexes": [ 674 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 674, 674 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2710", "outputIndexes": [ 675 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2711", "outputIndexes": [ 676 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2713", "outputIndexes": [ 677 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2714", "outputIndexes": [ 678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 676, 678, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2717", "outputIndexes": [ 679 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 679 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2718", "outputIndexes": [ 680 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 680, 680 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2720", "outputIndexes": [ 681 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672, 681, 675 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_108_output_0", "outputIndexes": [ 682 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_224_output_0", "outputIndexes": [ 683 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 675 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2728", "outputIndexes": [ 684 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2731", "outputIndexes": [ 685 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 673, 684, 685, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2734", "outputIndexes": [ 686 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 686 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2735", "outputIndexes": [ 687 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 687 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2736", "outputIndexes": [ 688 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 688, 687 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2737", "outputIndexes": [ 689 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 672, 689, 675 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_109_output_0", "outputIndexes": [ 690 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_225_output_0", "outputIndexes": [ 691 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 683, 691, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_91_output_0", "outputIndexes": [ 692 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 671, 692 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_64_output_0", "outputIndexes": [ 693 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_56_output_0", "outputIndexes": [ 694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693 ] , "main_type": "NONE", "name": "/Shape_100_output_0", "outputIndexes": [ 695 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 695 ] , "main_type": "NONE", "name": "Shape2838", "outputIndexes": [ 696 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 695 ] , "main_type": "NONE", "name": "Rank2840", "outputIndexes": [ 697 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 697, 697 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2842", "outputIndexes": [ 698 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2843", "outputIndexes": [ 699 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 698, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2845", "outputIndexes": [ 700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 700 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2846", "outputIndexes": [ 701 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 696, 699, 701, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2849", "outputIndexes": [ 702 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 702 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2850", "outputIndexes": [ 703 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 703 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2851", "outputIndexes": [ 704 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 704, 703 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2852", "outputIndexes": [ 705 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 695, 705, 698 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_110_output_0", "outputIndexes": [ 706 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 706, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_21_output_0", "outputIndexes": [ 707 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 707, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_231_output_0", "outputIndexes": [ 708 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 708, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_29_output_0", "outputIndexes": [ 709 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 709 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_14_output_0", "outputIndexes": [ 710 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 707, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_230_output_0", "outputIndexes": [ 711 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 693, 20, 711, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_28_output_0", "outputIndexes": [ 712 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 710, 712 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_94_output_0", "outputIndexes": [ 713 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 713, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_57_output_0", "outputIndexes": [ 714 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 694, 714 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_35_output_0", "outputIndexes": [ 715 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 65875020, 57366, 14336, 512, 0 ] } , "name": "/layers.7/self_attn/k_proj/Linear", "outputIndexes": [ 2388 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2388 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2389 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2389 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 716 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_226_output_0", "outputIndexes": [ 717 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_227_output_0", "outputIndexes": [ 718 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 717, 718, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_92_output_0", "outputIndexes": [ 719 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 716, 719 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_65_output_0", "outputIndexes": [ 720 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_58_output_0", "outputIndexes": [ 721 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720 ] , "main_type": "NONE", "name": "/Shape_101_output_0", "outputIndexes": [ 722 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 722 ] , "main_type": "NONE", "name": "Shape2744", "outputIndexes": [ 723 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 722 ] , "main_type": "NONE", "name": "Rank2746", "outputIndexes": [ 724 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 724, 724 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2748", "outputIndexes": [ 725 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2749", "outputIndexes": [ 726 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 725, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2751", "outputIndexes": [ 727 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 727 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze2752", "outputIndexes": [ 728 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 723, 726, 728, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice2755", "outputIndexes": [ 729 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 729 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze2756", "outputIndexes": [ 730 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 730 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2757", "outputIndexes": [ 731 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 731, 730 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp2758", "outputIndexes": [ 732 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 722, 732, 725 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_111_output_0", "outputIndexes": [ 733 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 733, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_22_output_0", "outputIndexes": [ 734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_233_output_0", "outputIndexes": [ 735 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 735, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_31_output_0", "outputIndexes": [ 736 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 736 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_15_output_0", "outputIndexes": [ 737 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 734, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_232_output_0", "outputIndexes": [ 738 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 720, 20, 738, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_30_output_0", "outputIndexes": [ 739 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 737, 739 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_95_output_0", "outputIndexes": [ 740 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 740, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_59_output_0", "outputIndexes": [ 741 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 721, 741 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_36_output_0", "outputIndexes": [ 742 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2383 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 65947234, 57366, 14336, 512, 0 ] } , "name": "/layers.7/self_attn/v_proj/Linear", "outputIndexes": [ 2392 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2392 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2393 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2393 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 743 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 682, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_228_output_0", "outputIndexes": [ 744 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 690, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_229_output_0", "outputIndexes": [ 745 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 744, 745, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_93_output_0", "outputIndexes": [ 746 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 743, 746 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_66_output_0", "outputIndexes": [ 747 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 715, 742, 747, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_71_output_0", "outputIndexes": [ 748 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 748 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2394 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2394 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2395 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2395 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 66019448, 401430, 100352, 0, 0 ] } , "name": "/layers.7/self_attn/o_proj/Linear", "outputIndexes": [ 2396 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2396 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2397 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2397 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.7/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 749 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 669, 749 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_38_output_0", "outputIndexes": [ 750 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 66521230, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_7/Mul_1_output_0", "outputIndexes": [ 751 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 751 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2398 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2398 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2399 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2399 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 66528398, 2179094, 544768, 0, 0 ] } , "name": "/layers.7/mlp/gate_proj/Linear", "outputIndexes": [ 2400 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2400 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2401 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2401 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 752 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 752 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_7/Mul_output_0", "outputIndexes": [ 753 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2399 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 69252260, 2179094, 544768, 0, 0 ] } , "name": "/layers.7/mlp/up_proj/Linear", "outputIndexes": [ 2404 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2404 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2405 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2405 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 754 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 753, 754 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_7/Mul_output_0", "outputIndexes": [ 755 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 755 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2406 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2406 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.7/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2407 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2407 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 71976122, 2179094, 544768, 0, 0 ] } , "name": "/layers.7/mlp/down_proj/Linear", "outputIndexes": [ 2408 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2408 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2409 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2409 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.7/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 756 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 750, 756 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_39_output_0", "outputIndexes": [ 757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 757, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_72_output_0", "outputIndexes": [ 758 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 758 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 74699984, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_8/Mul_1_output_0", "outputIndexes": [ 759 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2410 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2410 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2411 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 74707152, 401430, 100352, 3584, 0 ] } , "name": "/layers.8/self_attn/q_proj/Linear", "outputIndexes": [ 2412 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2412 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2413 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2413 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 760 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 759 ] , "main_type": "NONE", "name": "/Shape_112_output_0", "outputIndexes": [ 761 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 761 ] , "main_type": "NONE", "name": "Shape3077", "outputIndexes": [ 762 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 761 ] , "main_type": "NONE", "name": "Rank3079", "outputIndexes": [ 763 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 763, 763 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3081", "outputIndexes": [ 764 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3082", "outputIndexes": [ 765 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3084", "outputIndexes": [ 766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3085", "outputIndexes": [ 767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762, 765, 767, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3088", "outputIndexes": [ 768 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 768 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3089", "outputIndexes": [ 769 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 769, 769 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3091", "outputIndexes": [ 770 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761, 770, 764 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_123_output_0", "outputIndexes": [ 771 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_256_output_0", "outputIndexes": [ 772 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 764 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3099", "outputIndexes": [ 773 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3102", "outputIndexes": [ 774 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 762, 773, 774, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3105", "outputIndexes": [ 775 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 775 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3106", "outputIndexes": [ 776 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 776 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3107", "outputIndexes": [ 777 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 777, 776 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3108", "outputIndexes": [ 778 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 761, 778, 764 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_124_output_0", "outputIndexes": [ 779 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_257_output_0", "outputIndexes": [ 780 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 772, 780, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_104_output_0", "outputIndexes": [ 781 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 760, 781 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_73_output_0", "outputIndexes": [ 782 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_64_output_0", "outputIndexes": [ 783 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782 ] , "main_type": "NONE", "name": "/Shape_114_output_0", "outputIndexes": [ 784 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "Shape3209", "outputIndexes": [ 785 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 784 ] , "main_type": "NONE", "name": "Rank3211", "outputIndexes": [ 786 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 786, 786 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3213", "outputIndexes": [ 787 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3214", "outputIndexes": [ 788 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 787, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3216", "outputIndexes": [ 789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 789 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3217", "outputIndexes": [ 790 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 785, 788, 790, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3220", "outputIndexes": [ 791 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 791 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3221", "outputIndexes": [ 792 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 792 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3222", "outputIndexes": [ 793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 793, 792 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3223", "outputIndexes": [ 794 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 784, 794, 787 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_125_output_0", "outputIndexes": [ 795 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 795, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_24_output_0", "outputIndexes": [ 796 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_263_output_0", "outputIndexes": [ 797 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 797, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_33_output_0", "outputIndexes": [ 798 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 798 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_16_output_0", "outputIndexes": [ 799 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 796, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_262_output_0", "outputIndexes": [ 800 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 782, 20, 800, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_32_output_0", "outputIndexes": [ 801 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 799, 801 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_107_output_0", "outputIndexes": [ 802 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 802, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_65_output_0", "outputIndexes": [ 803 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 783, 803 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_40_output_0", "outputIndexes": [ 804 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75212518, 57366, 14336, 512, 0 ] } , "name": "/layers.8/self_attn/k_proj/Linear", "outputIndexes": [ 2416 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2416 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2417 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2417 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 805 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_258_output_0", "outputIndexes": [ 806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_259_output_0", "outputIndexes": [ 807 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 806, 807, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_105_output_0", "outputIndexes": [ 808 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 805, 808 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_74_output_0", "outputIndexes": [ 809 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_66_output_0", "outputIndexes": [ 810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809 ] , "main_type": "NONE", "name": "/Shape_115_output_0", "outputIndexes": [ 811 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 811 ] , "main_type": "NONE", "name": "Shape3115", "outputIndexes": [ 812 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 811 ] , "main_type": "NONE", "name": "Rank3117", "outputIndexes": [ 813 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 813, 813 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3119", "outputIndexes": [ 814 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3120", "outputIndexes": [ 815 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 814, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3122", "outputIndexes": [ 816 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 816 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3123", "outputIndexes": [ 817 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 812, 815, 817, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3126", "outputIndexes": [ 818 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 818 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3127", "outputIndexes": [ 819 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 819 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3128", "outputIndexes": [ 820 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 820, 819 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3129", "outputIndexes": [ 821 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 811, 821, 814 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_126_output_0", "outputIndexes": [ 822 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 822, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_25_output_0", "outputIndexes": [ 823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 823, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_265_output_0", "outputIndexes": [ 824 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 824, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_35_output_0", "outputIndexes": [ 825 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 825 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_17_output_0", "outputIndexes": [ 826 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 823, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_264_output_0", "outputIndexes": [ 827 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 809, 20, 827, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_34_output_0", "outputIndexes": [ 828 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 826, 828 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_108_output_0", "outputIndexes": [ 829 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 829, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_67_output_0", "outputIndexes": [ 830 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 810, 830 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_41_output_0", "outputIndexes": [ 831 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2411 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75284732, 57366, 14336, 512, 0 ] } , "name": "/layers.8/self_attn/v_proj/Linear", "outputIndexes": [ 2420 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2420 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2421 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2421 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 832 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 771, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_260_output_0", "outputIndexes": [ 833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 779, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_261_output_0", "outputIndexes": [ 834 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 833, 834, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_106_output_0", "outputIndexes": [ 835 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 832, 835 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_75_output_0", "outputIndexes": [ 836 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 804, 831, 836, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_80_output_0", "outputIndexes": [ 837 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 837 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2422 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2422 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2423 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2423 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75356946, 401430, 100352, 0, 0 ] } , "name": "/layers.8/self_attn/o_proj/Linear", "outputIndexes": [ 2424 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2424 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2425 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2425 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.8/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 838 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 758, 838 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_43_output_0", "outputIndexes": [ 839 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 75858728, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_8/Mul_1_output_0", "outputIndexes": [ 840 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 840 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2426 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2426 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2427 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 75865896, 2179094, 544768, 0, 0 ] } , "name": "/layers.8/mlp/gate_proj/Linear", "outputIndexes": [ 2428 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2428 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2429 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2429 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 841 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 841 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_8/Mul_output_0", "outputIndexes": [ 842 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2427 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 78589758, 2179094, 544768, 0, 0 ] } , "name": "/layers.8/mlp/up_proj/Linear", "outputIndexes": [ 2432 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2432 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2433 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2433 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 843 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 842, 843 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_8/Mul_output_0", "outputIndexes": [ 844 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 844 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2434 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2434 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.8/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2435 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2435 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 81313620, 2179094, 544768, 0, 0 ] } , "name": "/layers.8/mlp/down_proj/Linear", "outputIndexes": [ 2436 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2436 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2437 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2437 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.8/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 845 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 839, 845 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_44_output_0", "outputIndexes": [ 846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 846, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_81_output_0", "outputIndexes": [ 847 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 84037482, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_9/Mul_1_output_0", "outputIndexes": [ 848 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2438 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2438 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2439 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2439 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 84044650, 401430, 100352, 3584, 0 ] } , "name": "/layers.9/self_attn/q_proj/Linear", "outputIndexes": [ 2440 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2440 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2441 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2441 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 849 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 848 ] , "main_type": "NONE", "name": "/Shape_126_output_0", "outputIndexes": [ 850 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 850 ] , "main_type": "NONE", "name": "Shape3448", "outputIndexes": [ 851 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 850 ] , "main_type": "NONE", "name": "Rank3450", "outputIndexes": [ 852 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 852, 852 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3452", "outputIndexes": [ 853 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3453", "outputIndexes": [ 854 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3455", "outputIndexes": [ 855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3456", "outputIndexes": [ 856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 854, 856, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3459", "outputIndexes": [ 857 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 857 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3460", "outputIndexes": [ 858 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 858, 858 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3462", "outputIndexes": [ 859 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850, 859, 853 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_138_output_0", "outputIndexes": [ 860 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_288_output_0", "outputIndexes": [ 861 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 853 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3470", "outputIndexes": [ 862 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3473", "outputIndexes": [ 863 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 851, 862, 863, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3476", "outputIndexes": [ 864 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 864 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3477", "outputIndexes": [ 865 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 865 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3478", "outputIndexes": [ 866 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 866, 865 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3479", "outputIndexes": [ 867 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 850, 867, 853 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_139_output_0", "outputIndexes": [ 868 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_289_output_0", "outputIndexes": [ 869 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 861, 869, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_117_output_0", "outputIndexes": [ 870 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 849, 870 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_82_output_0", "outputIndexes": [ 871 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_72_output_0", "outputIndexes": [ 872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871 ] , "main_type": "NONE", "name": "/Shape_128_output_0", "outputIndexes": [ 873 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 873 ] , "main_type": "NONE", "name": "Shape3580", "outputIndexes": [ 874 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 873 ] , "main_type": "NONE", "name": "Rank3582", "outputIndexes": [ 875 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 875, 875 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3584", "outputIndexes": [ 876 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3585", "outputIndexes": [ 877 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 876, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3587", "outputIndexes": [ 878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 878 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3588", "outputIndexes": [ 879 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 874, 877, 879, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3591", "outputIndexes": [ 880 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 880 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3592", "outputIndexes": [ 881 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 881 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3593", "outputIndexes": [ 882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 882, 881 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3594", "outputIndexes": [ 883 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 873, 883, 876 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_140_output_0", "outputIndexes": [ 884 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 884, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_27_output_0", "outputIndexes": [ 885 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_295_output_0", "outputIndexes": [ 886 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 886, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_37_output_0", "outputIndexes": [ 887 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 887 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_18_output_0", "outputIndexes": [ 888 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 885, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_294_output_0", "outputIndexes": [ 889 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 871, 20, 889, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_36_output_0", "outputIndexes": [ 890 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 888, 890 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_120_output_0", "outputIndexes": [ 891 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 891, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_73_output_0", "outputIndexes": [ 892 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 872, 892 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_45_output_0", "outputIndexes": [ 893 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2439 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 84550016, 57366, 14336, 512, 0 ] } , "name": "/layers.9/self_attn/k_proj/Linear", "outputIndexes": [ 2444 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2444 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2445 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2445 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 894 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_290_output_0", "outputIndexes": [ 895 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_291_output_0", "outputIndexes": [ 896 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 895, 896, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_118_output_0", "outputIndexes": [ 897 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 894, 897 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_83_output_0", "outputIndexes": [ 898 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_74_output_0", "outputIndexes": [ 899 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898 ] , "main_type": "NONE", "name": "/Shape_129_output_0", "outputIndexes": [ 900 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 900 ] , "main_type": "NONE", "name": "Shape3486", "outputIndexes": [ 901 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 900 ] , "main_type": "NONE", "name": "Rank3488", "outputIndexes": [ 902 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 902, 902 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3490", "outputIndexes": [ 903 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 903 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3491", "outputIndexes": [ 904 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 903, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3493", "outputIndexes": [ 905 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 905 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3494", "outputIndexes": [ 906 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 901, 904, 906, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3497", "outputIndexes": [ 907 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 907 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3498", "outputIndexes": [ 908 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 908 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3499", "outputIndexes": [ 909 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 909, 908 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3500", "outputIndexes": [ 910 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 900, 910, 903 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_141_output_0", "outputIndexes": [ 911 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 911, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_28_output_0", "outputIndexes": [ 912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 912, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_297_output_0", "outputIndexes": [ 913 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 913, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_39_output_0", "outputIndexes": [ 914 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 914 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_19_output_0", "outputIndexes": [ 915 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 912, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_296_output_0", "outputIndexes": [ 916 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 898, 20, 916, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_38_output_0", "outputIndexes": [ 917 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 915, 917 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_121_output_0", "outputIndexes": [ 918 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 918, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_75_output_0", "outputIndexes": [ 919 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 899, 919 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_46_output_0", "outputIndexes": [ 920 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2439 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 84622230, 57366, 14336, 512, 0 ] } , "name": "/layers.9/self_attn/v_proj/Linear", "outputIndexes": [ 2448 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2448 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2449 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2449 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 921 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 860, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_292_output_0", "outputIndexes": [ 922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 868, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_293_output_0", "outputIndexes": [ 923 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 922, 923, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_119_output_0", "outputIndexes": [ 924 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 921, 924 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_84_output_0", "outputIndexes": [ 925 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 893, 920, 925, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_89_output_0", "outputIndexes": [ 926 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 926 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2450 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2450 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2451 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2451 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 84694444, 401430, 100352, 0, 0 ] } , "name": "/layers.9/self_attn/o_proj/Linear", "outputIndexes": [ 2452 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2452 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2453 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2453 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.9/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 927 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 847, 927 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_48_output_0", "outputIndexes": [ 928 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 85196226, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_9/Mul_1_output_0", "outputIndexes": [ 929 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 929 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2454 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2454 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2455 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 85203394, 2179094, 544768, 0, 0 ] } , "name": "/layers.9/mlp/gate_proj/Linear", "outputIndexes": [ 2456 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2456 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2457 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2457 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 930 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 930 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_9/Mul_output_0", "outputIndexes": [ 931 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2455 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 87927256, 2179094, 544768, 0, 0 ] } , "name": "/layers.9/mlp/up_proj/Linear", "outputIndexes": [ 2460 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2460 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2461 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2461 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 932 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 931, 932 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_9/Mul_output_0", "outputIndexes": [ 933 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 933 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2462 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2462 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.9/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2463 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2463 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 90651118, 2179094, 544768, 0, 0 ] } , "name": "/layers.9/mlp/down_proj/Linear", "outputIndexes": [ 2464 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2464 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2465 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2465 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.9/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 934 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 928, 934 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_49_output_0", "outputIndexes": [ 935 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 935, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_90_output_0", "outputIndexes": [ 936 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 936 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 93374980, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_10/Mul_1_output_0", "outputIndexes": [ 937 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2466 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2467 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 93382148, 401430, 100352, 3584, 0 ] } , "name": "/layers.10/self_attn/q_proj/Linear", "outputIndexes": [ 2468 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2468 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2469 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2469 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 938 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 937 ] , "main_type": "NONE", "name": "/Shape_140_output_0", "outputIndexes": [ 939 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 939 ] , "main_type": "NONE", "name": "Shape3819", "outputIndexes": [ 940 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 939 ] , "main_type": "NONE", "name": "Rank3821", "outputIndexes": [ 941 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 941, 941 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3823", "outputIndexes": [ 942 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3824", "outputIndexes": [ 943 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3826", "outputIndexes": [ 944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3827", "outputIndexes": [ 945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940, 943, 945, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3830", "outputIndexes": [ 946 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 946 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3831", "outputIndexes": [ 947 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 947, 947 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3833", "outputIndexes": [ 948 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939, 948, 942 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_153_output_0", "outputIndexes": [ 949 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_320_output_0", "outputIndexes": [ 950 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 942 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3841", "outputIndexes": [ 951 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3844", "outputIndexes": [ 952 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 940, 951, 952, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3847", "outputIndexes": [ 953 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 953 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3848", "outputIndexes": [ 954 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 954 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3849", "outputIndexes": [ 955 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 955, 954 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3850", "outputIndexes": [ 956 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 939, 956, 942 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_154_output_0", "outputIndexes": [ 957 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_321_output_0", "outputIndexes": [ 958 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 950, 958, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_130_output_0", "outputIndexes": [ 959 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 938, 959 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_91_output_0", "outputIndexes": [ 960 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_80_output_0", "outputIndexes": [ 961 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960 ] , "main_type": "NONE", "name": "/Shape_142_output_0", "outputIndexes": [ 962 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 962 ] , "main_type": "NONE", "name": "Shape3951", "outputIndexes": [ 963 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 962 ] , "main_type": "NONE", "name": "Rank3953", "outputIndexes": [ 964 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 964, 964 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3955", "outputIndexes": [ 965 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 965 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3956", "outputIndexes": [ 966 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 965, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3958", "outputIndexes": [ 967 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 967 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3959", "outputIndexes": [ 968 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 963, 966, 968, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3962", "outputIndexes": [ 969 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 969 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3963", "outputIndexes": [ 970 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 970 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3964", "outputIndexes": [ 971 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 971, 970 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3965", "outputIndexes": [ 972 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 962, 972, 965 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_155_output_0", "outputIndexes": [ 973 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 973, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_30_output_0", "outputIndexes": [ 974 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 974, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_327_output_0", "outputIndexes": [ 975 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960, 975, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_41_output_0", "outputIndexes": [ 976 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 976 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_20_output_0", "outputIndexes": [ 977 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 974, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_326_output_0", "outputIndexes": [ 978 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 960, 20, 978, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_40_output_0", "outputIndexes": [ 979 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 977, 979 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_133_output_0", "outputIndexes": [ 980 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 980, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_81_output_0", "outputIndexes": [ 981 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 961, 981 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_50_output_0", "outputIndexes": [ 982 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 93887514, 57366, 14336, 512, 0 ] } , "name": "/layers.10/self_attn/k_proj/Linear", "outputIndexes": [ 2472 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2472 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2473 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2473 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 983 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_322_output_0", "outputIndexes": [ 984 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_323_output_0", "outputIndexes": [ 985 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 984, 985, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_131_output_0", "outputIndexes": [ 986 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 983, 986 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_92_output_0", "outputIndexes": [ 987 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_82_output_0", "outputIndexes": [ 988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987 ] , "main_type": "NONE", "name": "/Shape_143_output_0", "outputIndexes": [ 989 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 989 ] , "main_type": "NONE", "name": "Shape3857", "outputIndexes": [ 990 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 989 ] , "main_type": "NONE", "name": "Rank3859", "outputIndexes": [ 991 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 991, 991 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3861", "outputIndexes": [ 992 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3862", "outputIndexes": [ 993 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 992, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3864", "outputIndexes": [ 994 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 994 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze3865", "outputIndexes": [ 995 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 990, 993, 995, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice3868", "outputIndexes": [ 996 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 996 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze3869", "outputIndexes": [ 997 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 997 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3870", "outputIndexes": [ 998 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 998, 997 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp3871", "outputIndexes": [ 999 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 989, 999, 992 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_156_output_0", "outputIndexes": [ 1000 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1000, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_31_output_0", "outputIndexes": [ 1001 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1001, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_329_output_0", "outputIndexes": [ 1002 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 1002, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_43_output_0", "outputIndexes": [ 1003 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1003 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_21_output_0", "outputIndexes": [ 1004 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1001, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_328_output_0", "outputIndexes": [ 1005 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 987, 20, 1005, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_42_output_0", "outputIndexes": [ 1006 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1004, 1006 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_134_output_0", "outputIndexes": [ 1007 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1007, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_83_output_0", "outputIndexes": [ 1008 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 988, 1008 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_51_output_0", "outputIndexes": [ 1009 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2467 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 93959728, 57366, 14336, 512, 0 ] } , "name": "/layers.10/self_attn/v_proj/Linear", "outputIndexes": [ 2476 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2476 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2477 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2477 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1010 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 949, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_324_output_0", "outputIndexes": [ 1011 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 957, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_325_output_0", "outputIndexes": [ 1012 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1011, 1012, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_132_output_0", "outputIndexes": [ 1013 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1010, 1013 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_93_output_0", "outputIndexes": [ 1014 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 982, 1009, 1014, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_98_output_0", "outputIndexes": [ 1015 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1015 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2478 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2478 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2479 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2479 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 94031942, 401430, 100352, 0, 0 ] } , "name": "/layers.10/self_attn/o_proj/Linear", "outputIndexes": [ 2480 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2480 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2481 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2481 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.10/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1016 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 936, 1016 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_53_output_0", "outputIndexes": [ 1017 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 94533724, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_10/Mul_1_output_0", "outputIndexes": [ 1018 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1018 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2482 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2482 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2483 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2483 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 94540892, 2179094, 544768, 0, 0 ] } , "name": "/layers.10/mlp/gate_proj/Linear", "outputIndexes": [ 2484 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2484 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2485 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2485 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1019 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1019 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_10/Mul_output_0", "outputIndexes": [ 1020 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2483 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 97264754, 2179094, 544768, 0, 0 ] } , "name": "/layers.10/mlp/up_proj/Linear", "outputIndexes": [ 2488 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2488 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2489 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2489 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1021 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1020, 1021 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_10/Mul_output_0", "outputIndexes": [ 1022 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1022 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2490 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2490 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.10/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2491 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2491 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 99988616, 2179094, 544768, 0, 0 ] } , "name": "/layers.10/mlp/down_proj/Linear", "outputIndexes": [ 2492 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2492 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2493 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2493 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.10/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1023 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1017, 1023 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_54_output_0", "outputIndexes": [ 1024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1024, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_99_output_0", "outputIndexes": [ 1025 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 102712478, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_11/Mul_1_output_0", "outputIndexes": [ 1026 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2494 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2494 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2495 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 102719646, 401430, 100352, 3584, 0 ] } , "name": "/layers.11/self_attn/q_proj/Linear", "outputIndexes": [ 2496 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2496 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2497 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2497 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1027 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1026 ] , "main_type": "NONE", "name": "/Shape_154_output_0", "outputIndexes": [ 1028 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1028 ] , "main_type": "NONE", "name": "Shape4190", "outputIndexes": [ 1029 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1028 ] , "main_type": "NONE", "name": "Rank4192", "outputIndexes": [ 1030 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1030, 1030 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4194", "outputIndexes": [ 1031 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4195", "outputIndexes": [ 1032 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4197", "outputIndexes": [ 1033 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4198", "outputIndexes": [ 1034 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029, 1032, 1034, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4201", "outputIndexes": [ 1035 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1035 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4202", "outputIndexes": [ 1036 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1036, 1036 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4204", "outputIndexes": [ 1037 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028, 1037, 1031 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_168_output_0", "outputIndexes": [ 1038 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_352_output_0", "outputIndexes": [ 1039 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1031 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4212", "outputIndexes": [ 1040 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4215", "outputIndexes": [ 1041 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1029, 1040, 1041, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4218", "outputIndexes": [ 1042 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1042 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4219", "outputIndexes": [ 1043 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1043 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4220", "outputIndexes": [ 1044 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1044, 1043 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4221", "outputIndexes": [ 1045 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1028, 1045, 1031 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_169_output_0", "outputIndexes": [ 1046 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_353_output_0", "outputIndexes": [ 1047 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1039, 1047, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_143_output_0", "outputIndexes": [ 1048 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1027, 1048 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_100_output_0", "outputIndexes": [ 1049 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_88_output_0", "outputIndexes": [ 1050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049 ] , "main_type": "NONE", "name": "/Shape_156_output_0", "outputIndexes": [ 1051 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1051 ] , "main_type": "NONE", "name": "Shape4322", "outputIndexes": [ 1052 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1051 ] , "main_type": "NONE", "name": "Rank4324", "outputIndexes": [ 1053 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1053, 1053 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4326", "outputIndexes": [ 1054 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4327", "outputIndexes": [ 1055 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1054, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4329", "outputIndexes": [ 1056 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1056 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4330", "outputIndexes": [ 1057 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1052, 1055, 1057, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4333", "outputIndexes": [ 1058 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1058 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4334", "outputIndexes": [ 1059 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1059 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4335", "outputIndexes": [ 1060 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1060, 1059 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4336", "outputIndexes": [ 1061 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1051, 1061, 1054 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_170_output_0", "outputIndexes": [ 1062 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1062, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_33_output_0", "outputIndexes": [ 1063 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_359_output_0", "outputIndexes": [ 1064 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 1064, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_45_output_0", "outputIndexes": [ 1065 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1065 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_22_output_0", "outputIndexes": [ 1066 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1063, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_358_output_0", "outputIndexes": [ 1067 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1049, 20, 1067, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_44_output_0", "outputIndexes": [ 1068 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1066, 1068 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_146_output_0", "outputIndexes": [ 1069 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1069, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_89_output_0", "outputIndexes": [ 1070 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1050, 1070 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_55_output_0", "outputIndexes": [ 1071 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 103225012, 57366, 14336, 512, 0 ] } , "name": "/layers.11/self_attn/k_proj/Linear", "outputIndexes": [ 2500 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2500 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2501 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2501 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1072 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_354_output_0", "outputIndexes": [ 1073 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_355_output_0", "outputIndexes": [ 1074 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1073, 1074, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_144_output_0", "outputIndexes": [ 1075 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1072, 1075 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_101_output_0", "outputIndexes": [ 1076 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_90_output_0", "outputIndexes": [ 1077 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076 ] , "main_type": "NONE", "name": "/Shape_157_output_0", "outputIndexes": [ 1078 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1078 ] , "main_type": "NONE", "name": "Shape4228", "outputIndexes": [ 1079 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1078 ] , "main_type": "NONE", "name": "Rank4230", "outputIndexes": [ 1080 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1080, 1080 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4232", "outputIndexes": [ 1081 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1081 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4233", "outputIndexes": [ 1082 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1081, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4235", "outputIndexes": [ 1083 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1083 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4236", "outputIndexes": [ 1084 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1079, 1082, 1084, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4239", "outputIndexes": [ 1085 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1085 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4240", "outputIndexes": [ 1086 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1086 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4241", "outputIndexes": [ 1087 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1087, 1086 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4242", "outputIndexes": [ 1088 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1078, 1088, 1081 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_171_output_0", "outputIndexes": [ 1089 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1089, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_34_output_0", "outputIndexes": [ 1090 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_361_output_0", "outputIndexes": [ 1091 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 1091, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_47_output_0", "outputIndexes": [ 1092 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1092 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_23_output_0", "outputIndexes": [ 1093 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1090, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_360_output_0", "outputIndexes": [ 1094 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1076, 20, 1094, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_46_output_0", "outputIndexes": [ 1095 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1093, 1095 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_147_output_0", "outputIndexes": [ 1096 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1096, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_91_output_0", "outputIndexes": [ 1097 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1077, 1097 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_56_output_0", "outputIndexes": [ 1098 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2495 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 103297226, 57366, 14336, 512, 0 ] } , "name": "/layers.11/self_attn/v_proj/Linear", "outputIndexes": [ 2504 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2504 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2505 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2505 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1099 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1038, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_356_output_0", "outputIndexes": [ 1100 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1046, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_357_output_0", "outputIndexes": [ 1101 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1100, 1101, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_145_output_0", "outputIndexes": [ 1102 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1099, 1102 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_102_output_0", "outputIndexes": [ 1103 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1071, 1098, 1103, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_107_output_0", "outputIndexes": [ 1104 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1104 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2506 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2506 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2507 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2507 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 103369440, 401430, 100352, 0, 0 ] } , "name": "/layers.11/self_attn/o_proj/Linear", "outputIndexes": [ 2508 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2508 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2509 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2509 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.11/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1105 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1025, 1105 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_58_output_0", "outputIndexes": [ 1106 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 103871222, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_11/Mul_1_output_0", "outputIndexes": [ 1107 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1107 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2510 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2510 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2511 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2511 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 103878390, 2179094, 544768, 0, 0 ] } , "name": "/layers.11/mlp/gate_proj/Linear", "outputIndexes": [ 2512 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2512 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2513 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2513 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1108 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1108 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_11/Mul_output_0", "outputIndexes": [ 1109 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2511 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 106602252, 2179094, 544768, 0, 0 ] } , "name": "/layers.11/mlp/up_proj/Linear", "outputIndexes": [ 2516 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2516 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2517 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2517 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1110 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1109, 1110 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_11/Mul_output_0", "outputIndexes": [ 1111 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1111 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2518 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2518 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.11/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2519 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2519 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 109326114, 2179094, 544768, 0, 0 ] } , "name": "/layers.11/mlp/down_proj/Linear", "outputIndexes": [ 2520 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2520 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2521 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2521 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.11/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1112 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1106, 1112 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_59_output_0", "outputIndexes": [ 1113 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1113, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_108_output_0", "outputIndexes": [ 1114 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1114 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 112049976, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_12/Mul_1_output_0", "outputIndexes": [ 1115 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1115 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2522 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2522 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2523 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 112057144, 401430, 100352, 3584, 0 ] } , "name": "/layers.12/self_attn/q_proj/Linear", "outputIndexes": [ 2524 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2524 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2525 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2525 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1116 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1115 ] , "main_type": "NONE", "name": "/Shape_168_output_0", "outputIndexes": [ 1117 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1117 ] , "main_type": "NONE", "name": "Shape4561", "outputIndexes": [ 1118 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1117 ] , "main_type": "NONE", "name": "Rank4563", "outputIndexes": [ 1119 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1119, 1119 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4565", "outputIndexes": [ 1120 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4566", "outputIndexes": [ 1121 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4568", "outputIndexes": [ 1122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4569", "outputIndexes": [ 1123 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 1121, 1123, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4572", "outputIndexes": [ 1124 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1124 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4573", "outputIndexes": [ 1125 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1125, 1125 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4575", "outputIndexes": [ 1126 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117, 1126, 1120 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_183_output_0", "outputIndexes": [ 1127 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_384_output_0", "outputIndexes": [ 1128 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1120 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4583", "outputIndexes": [ 1129 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4586", "outputIndexes": [ 1130 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1118, 1129, 1130, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4589", "outputIndexes": [ 1131 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1131 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4590", "outputIndexes": [ 1132 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1132 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4591", "outputIndexes": [ 1133 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1133, 1132 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4592", "outputIndexes": [ 1134 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1117, 1134, 1120 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_184_output_0", "outputIndexes": [ 1135 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_385_output_0", "outputIndexes": [ 1136 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1128, 1136, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_156_output_0", "outputIndexes": [ 1137 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1116, 1137 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_109_output_0", "outputIndexes": [ 1138 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_96_output_0", "outputIndexes": [ 1139 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138 ] , "main_type": "NONE", "name": "/Shape_170_output_0", "outputIndexes": [ 1140 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1140 ] , "main_type": "NONE", "name": "Shape4693", "outputIndexes": [ 1141 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1140 ] , "main_type": "NONE", "name": "Rank4695", "outputIndexes": [ 1142 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1142, 1142 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4697", "outputIndexes": [ 1143 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4698", "outputIndexes": [ 1144 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1143, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4700", "outputIndexes": [ 1145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1145 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4701", "outputIndexes": [ 1146 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1141, 1144, 1146, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4704", "outputIndexes": [ 1147 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1147 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4705", "outputIndexes": [ 1148 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1148 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4706", "outputIndexes": [ 1149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1149, 1148 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4707", "outputIndexes": [ 1150 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1140, 1150, 1143 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_185_output_0", "outputIndexes": [ 1151 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1151, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_36_output_0", "outputIndexes": [ 1152 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_391_output_0", "outputIndexes": [ 1153 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 1153, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_49_output_0", "outputIndexes": [ 1154 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1154 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_24_output_0", "outputIndexes": [ 1155 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1152, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_390_output_0", "outputIndexes": [ 1156 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1138, 20, 1156, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_48_output_0", "outputIndexes": [ 1157 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1155, 1157 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_159_output_0", "outputIndexes": [ 1158 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1158, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_97_output_0", "outputIndexes": [ 1159 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1139, 1159 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_60_output_0", "outputIndexes": [ 1160 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 112562510, 57366, 14336, 512, 0 ] } , "name": "/layers.12/self_attn/k_proj/Linear", "outputIndexes": [ 2528 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2528 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2529 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2529 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1161 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_386_output_0", "outputIndexes": [ 1162 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_387_output_0", "outputIndexes": [ 1163 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1162, 1163, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_157_output_0", "outputIndexes": [ 1164 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1161, 1164 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_110_output_0", "outputIndexes": [ 1165 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_98_output_0", "outputIndexes": [ 1166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165 ] , "main_type": "NONE", "name": "/Shape_171_output_0", "outputIndexes": [ 1167 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "Shape4599", "outputIndexes": [ 1168 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1167 ] , "main_type": "NONE", "name": "Rank4601", "outputIndexes": [ 1169 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1169, 1169 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4603", "outputIndexes": [ 1170 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4604", "outputIndexes": [ 1171 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1170, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4606", "outputIndexes": [ 1172 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1172 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4607", "outputIndexes": [ 1173 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1168, 1171, 1173, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4610", "outputIndexes": [ 1174 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1174 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4611", "outputIndexes": [ 1175 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1175 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4612", "outputIndexes": [ 1176 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1176, 1175 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4613", "outputIndexes": [ 1177 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1167, 1177, 1170 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_186_output_0", "outputIndexes": [ 1178 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1178, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_37_output_0", "outputIndexes": [ 1179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_393_output_0", "outputIndexes": [ 1180 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 1180, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_51_output_0", "outputIndexes": [ 1181 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1181 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_25_output_0", "outputIndexes": [ 1182 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1179, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_392_output_0", "outputIndexes": [ 1183 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1165, 20, 1183, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_50_output_0", "outputIndexes": [ 1184 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1182, 1184 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_160_output_0", "outputIndexes": [ 1185 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1185, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_99_output_0", "outputIndexes": [ 1186 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1166, 1186 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_61_output_0", "outputIndexes": [ 1187 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2523 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 112634724, 57366, 14336, 512, 0 ] } , "name": "/layers.12/self_attn/v_proj/Linear", "outputIndexes": [ 2532 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2532 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2533 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2533 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1188 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1127, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_388_output_0", "outputIndexes": [ 1189 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1135, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_389_output_0", "outputIndexes": [ 1190 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1189, 1190, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_158_output_0", "outputIndexes": [ 1191 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1188, 1191 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_111_output_0", "outputIndexes": [ 1192 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1160, 1187, 1192, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_116_output_0", "outputIndexes": [ 1193 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1193 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2534 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2534 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2535 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2535 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 112706938, 401430, 100352, 0, 0 ] } , "name": "/layers.12/self_attn/o_proj/Linear", "outputIndexes": [ 2536 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2536 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2537 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2537 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.12/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1194 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1114, 1194 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_63_output_0", "outputIndexes": [ 1195 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 113208720, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_12/Mul_1_output_0", "outputIndexes": [ 1196 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1196 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2538 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2538 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2539 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2539 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 113215888, 2179094, 544768, 0, 0 ] } , "name": "/layers.12/mlp/gate_proj/Linear", "outputIndexes": [ 2540 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2540 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2541 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2541 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1197 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1197 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_12/Mul_output_0", "outputIndexes": [ 1198 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2539 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 115939750, 2179094, 544768, 0, 0 ] } , "name": "/layers.12/mlp/up_proj/Linear", "outputIndexes": [ 2544 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2544 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2545 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2545 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1199 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1198, 1199 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_12/Mul_output_0", "outputIndexes": [ 1200 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1200 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2546 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2546 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.12/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2547 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2547 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 118663612, 2179094, 544768, 0, 0 ] } , "name": "/layers.12/mlp/down_proj/Linear", "outputIndexes": [ 2548 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2548 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2549 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2549 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.12/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1201 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1195, 1201 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_64_output_0", "outputIndexes": [ 1202 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1202, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_117_output_0", "outputIndexes": [ 1203 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 121387474, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_13/Mul_1_output_0", "outputIndexes": [ 1204 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2550 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2550 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2551 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 121394642, 401430, 100352, 3584, 0 ] } , "name": "/layers.13/self_attn/q_proj/Linear", "outputIndexes": [ 2552 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2552 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2553 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2553 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1205 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1204 ] , "main_type": "NONE", "name": "/Shape_182_output_0", "outputIndexes": [ 1206 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "Shape4932", "outputIndexes": [ 1207 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1206 ] , "main_type": "NONE", "name": "Rank4934", "outputIndexes": [ 1208 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1208, 1208 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4936", "outputIndexes": [ 1209 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4937", "outputIndexes": [ 1210 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4939", "outputIndexes": [ 1211 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4940", "outputIndexes": [ 1212 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1210, 1212, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4943", "outputIndexes": [ 1213 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1213 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4944", "outputIndexes": [ 1214 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1214, 1214 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4946", "outputIndexes": [ 1215 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1215, 1209 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_198_output_0", "outputIndexes": [ 1216 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_416_output_0", "outputIndexes": [ 1217 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1209 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4954", "outputIndexes": [ 1218 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1211 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4957", "outputIndexes": [ 1219 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1207, 1218, 1219, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4960", "outputIndexes": [ 1220 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1220 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4961", "outputIndexes": [ 1221 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1221 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4962", "outputIndexes": [ 1222 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1222, 1221 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4963", "outputIndexes": [ 1223 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1206, 1223, 1209 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_199_output_0", "outputIndexes": [ 1224 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_417_output_0", "outputIndexes": [ 1225 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1217, 1225, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_169_output_0", "outputIndexes": [ 1226 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1205, 1226 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_118_output_0", "outputIndexes": [ 1227 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_104_output_0", "outputIndexes": [ 1228 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227 ] , "main_type": "NONE", "name": "/Shape_184_output_0", "outputIndexes": [ 1229 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1229 ] , "main_type": "NONE", "name": "Shape5064", "outputIndexes": [ 1230 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1229 ] , "main_type": "NONE", "name": "Rank5066", "outputIndexes": [ 1231 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1231, 1231 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5068", "outputIndexes": [ 1232 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5069", "outputIndexes": [ 1233 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1232, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5071", "outputIndexes": [ 1234 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1234 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5072", "outputIndexes": [ 1235 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1230, 1233, 1235, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5075", "outputIndexes": [ 1236 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1236 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5076", "outputIndexes": [ 1237 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1237 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5077", "outputIndexes": [ 1238 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1238, 1237 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5078", "outputIndexes": [ 1239 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1229, 1239, 1232 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_200_output_0", "outputIndexes": [ 1240 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1240, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_39_output_0", "outputIndexes": [ 1241 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1241, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_423_output_0", "outputIndexes": [ 1242 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 1242, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_53_output_0", "outputIndexes": [ 1243 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1243 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_26_output_0", "outputIndexes": [ 1244 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1241, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_422_output_0", "outputIndexes": [ 1245 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1227, 20, 1245, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_52_output_0", "outputIndexes": [ 1246 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1244, 1246 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_172_output_0", "outputIndexes": [ 1247 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1247, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_105_output_0", "outputIndexes": [ 1248 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1228, 1248 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_65_output_0", "outputIndexes": [ 1249 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 121900008, 57366, 14336, 512, 0 ] } , "name": "/layers.13/self_attn/k_proj/Linear", "outputIndexes": [ 2556 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2556 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2557 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2557 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1250 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_418_output_0", "outputIndexes": [ 1251 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_419_output_0", "outputIndexes": [ 1252 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1251, 1252, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_170_output_0", "outputIndexes": [ 1253 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1250, 1253 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_119_output_0", "outputIndexes": [ 1254 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_106_output_0", "outputIndexes": [ 1255 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254 ] , "main_type": "NONE", "name": "/Shape_185_output_0", "outputIndexes": [ 1256 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1256 ] , "main_type": "NONE", "name": "Shape4970", "outputIndexes": [ 1257 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1256 ] , "main_type": "NONE", "name": "Rank4972", "outputIndexes": [ 1258 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1258, 1258 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4974", "outputIndexes": [ 1259 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4975", "outputIndexes": [ 1260 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1259, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4977", "outputIndexes": [ 1261 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1261 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze4978", "outputIndexes": [ 1262 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1257, 1260, 1262, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice4981", "outputIndexes": [ 1263 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1263 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze4982", "outputIndexes": [ 1264 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1264 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4983", "outputIndexes": [ 1265 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1265, 1264 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp4984", "outputIndexes": [ 1266 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1256, 1266, 1259 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_201_output_0", "outputIndexes": [ 1267 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1267, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_40_output_0", "outputIndexes": [ 1268 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_425_output_0", "outputIndexes": [ 1269 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 1269, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_55_output_0", "outputIndexes": [ 1270 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1270 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_27_output_0", "outputIndexes": [ 1271 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1268, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_424_output_0", "outputIndexes": [ 1272 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1254, 20, 1272, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_54_output_0", "outputIndexes": [ 1273 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1271, 1273 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_173_output_0", "outputIndexes": [ 1274 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1274, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_107_output_0", "outputIndexes": [ 1275 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1255, 1275 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_66_output_0", "outputIndexes": [ 1276 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2551 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 121972222, 57366, 14336, 512, 0 ] } , "name": "/layers.13/self_attn/v_proj/Linear", "outputIndexes": [ 2560 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2560 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2561 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2561 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1277 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1216, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_420_output_0", "outputIndexes": [ 1278 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1224, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_421_output_0", "outputIndexes": [ 1279 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1278, 1279, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_171_output_0", "outputIndexes": [ 1280 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1277, 1280 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_120_output_0", "outputIndexes": [ 1281 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1249, 1276, 1281, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_125_output_0", "outputIndexes": [ 1282 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1282 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2562 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2562 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2563 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2563 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 122044436, 401430, 100352, 0, 0 ] } , "name": "/layers.13/self_attn/o_proj/Linear", "outputIndexes": [ 2564 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2564 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2565 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2565 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.13/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1283 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1203, 1283 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_68_output_0", "outputIndexes": [ 1284 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 122546218, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_13/Mul_1_output_0", "outputIndexes": [ 1285 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1285 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2566 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2566 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2567 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 122553386, 2179094, 544768, 0, 0 ] } , "name": "/layers.13/mlp/gate_proj/Linear", "outputIndexes": [ 2568 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2568 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2569 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2569 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1286 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1286 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_13/Mul_output_0", "outputIndexes": [ 1287 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2567 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 125277248, 2179094, 544768, 0, 0 ] } , "name": "/layers.13/mlp/up_proj/Linear", "outputIndexes": [ 2572 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2572 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2573 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2573 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1288 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1287, 1288 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_13/Mul_output_0", "outputIndexes": [ 1289 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1289 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2574 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2574 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.13/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2575 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2575 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 128001110, 2179094, 544768, 0, 0 ] } , "name": "/layers.13/mlp/down_proj/Linear", "outputIndexes": [ 2576 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2576 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2577 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2577 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.13/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1290 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1284, 1290 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_69_output_0", "outputIndexes": [ 1291 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1291, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_126_output_0", "outputIndexes": [ 1292 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1292 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 130724972, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_14/Mul_1_output_0", "outputIndexes": [ 1293 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1293 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2578 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2578 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2579 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2579 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 130732140, 401430, 100352, 3584, 0 ] } , "name": "/layers.14/self_attn/q_proj/Linear", "outputIndexes": [ 2580 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2580 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2581 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2581 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1294 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1293 ] , "main_type": "NONE", "name": "/Shape_196_output_0", "outputIndexes": [ 1295 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1295 ] , "main_type": "NONE", "name": "Shape5303", "outputIndexes": [ 1296 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1295 ] , "main_type": "NONE", "name": "Rank5305", "outputIndexes": [ 1297 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1297, 1297 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5307", "outputIndexes": [ 1298 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5308", "outputIndexes": [ 1299 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5310", "outputIndexes": [ 1300 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5311", "outputIndexes": [ 1301 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1296, 1299, 1301, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5314", "outputIndexes": [ 1302 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1302 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5315", "outputIndexes": [ 1303 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1303, 1303 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5317", "outputIndexes": [ 1304 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 1304, 1298 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_213_output_0", "outputIndexes": [ 1305 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_448_output_0", "outputIndexes": [ 1306 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1298 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5325", "outputIndexes": [ 1307 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1300 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5328", "outputIndexes": [ 1308 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1296, 1307, 1308, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5331", "outputIndexes": [ 1309 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1309 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5332", "outputIndexes": [ 1310 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1310 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5333", "outputIndexes": [ 1311 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1311, 1310 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5334", "outputIndexes": [ 1312 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1295, 1312, 1298 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_214_output_0", "outputIndexes": [ 1313 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_449_output_0", "outputIndexes": [ 1314 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1306, 1314, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_182_output_0", "outputIndexes": [ 1315 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1294, 1315 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_127_output_0", "outputIndexes": [ 1316 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_112_output_0", "outputIndexes": [ 1317 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316 ] , "main_type": "NONE", "name": "/Shape_198_output_0", "outputIndexes": [ 1318 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1318 ] , "main_type": "NONE", "name": "Shape5435", "outputIndexes": [ 1319 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1318 ] , "main_type": "NONE", "name": "Rank5437", "outputIndexes": [ 1320 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1320, 1320 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5439", "outputIndexes": [ 1321 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1321 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5440", "outputIndexes": [ 1322 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1321, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5442", "outputIndexes": [ 1323 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1323 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5443", "outputIndexes": [ 1324 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1319, 1322, 1324, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5446", "outputIndexes": [ 1325 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1325 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5447", "outputIndexes": [ 1326 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1326 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5448", "outputIndexes": [ 1327 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1327, 1326 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5449", "outputIndexes": [ 1328 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1318, 1328, 1321 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_215_output_0", "outputIndexes": [ 1329 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1329, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_42_output_0", "outputIndexes": [ 1330 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_455_output_0", "outputIndexes": [ 1331 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 1331, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_57_output_0", "outputIndexes": [ 1332 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1332 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_28_output_0", "outputIndexes": [ 1333 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1330, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_454_output_0", "outputIndexes": [ 1334 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1316, 20, 1334, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_56_output_0", "outputIndexes": [ 1335 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1333, 1335 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_185_output_0", "outputIndexes": [ 1336 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1336, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_113_output_0", "outputIndexes": [ 1337 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1317, 1337 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_70_output_0", "outputIndexes": [ 1338 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2579 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 131237506, 57366, 14336, 512, 0 ] } , "name": "/layers.14/self_attn/k_proj/Linear", "outputIndexes": [ 2584 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2584 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2585 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2585 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1339 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_450_output_0", "outputIndexes": [ 1340 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_451_output_0", "outputIndexes": [ 1341 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1340, 1341, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_183_output_0", "outputIndexes": [ 1342 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1339, 1342 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_128_output_0", "outputIndexes": [ 1343 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_114_output_0", "outputIndexes": [ 1344 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343 ] , "main_type": "NONE", "name": "/Shape_199_output_0", "outputIndexes": [ 1345 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1345 ] , "main_type": "NONE", "name": "Shape5341", "outputIndexes": [ 1346 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1345 ] , "main_type": "NONE", "name": "Rank5343", "outputIndexes": [ 1347 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1347, 1347 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5345", "outputIndexes": [ 1348 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5346", "outputIndexes": [ 1349 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1348, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5348", "outputIndexes": [ 1350 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1350 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5349", "outputIndexes": [ 1351 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1346, 1349, 1351, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5352", "outputIndexes": [ 1352 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1352 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5353", "outputIndexes": [ 1353 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1353 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5354", "outputIndexes": [ 1354 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1354, 1353 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5355", "outputIndexes": [ 1355 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1345, 1355, 1348 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_216_output_0", "outputIndexes": [ 1356 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1356, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_43_output_0", "outputIndexes": [ 1357 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1357, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_457_output_0", "outputIndexes": [ 1358 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 1358, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_59_output_0", "outputIndexes": [ 1359 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1359 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_29_output_0", "outputIndexes": [ 1360 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1357, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_456_output_0", "outputIndexes": [ 1361 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1343, 20, 1361, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_58_output_0", "outputIndexes": [ 1362 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1360, 1362 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_186_output_0", "outputIndexes": [ 1363 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1363, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_115_output_0", "outputIndexes": [ 1364 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1344, 1364 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_71_output_0", "outputIndexes": [ 1365 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2579 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 131309720, 57366, 14336, 512, 0 ] } , "name": "/layers.14/self_attn/v_proj/Linear", "outputIndexes": [ 2588 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2588 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2589 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2589 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1366 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1305, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_452_output_0", "outputIndexes": [ 1367 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1313, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_453_output_0", "outputIndexes": [ 1368 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1367, 1368, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_184_output_0", "outputIndexes": [ 1369 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1366, 1369 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_129_output_0", "outputIndexes": [ 1370 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1338, 1365, 1370, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_134_output_0", "outputIndexes": [ 1371 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1371 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2590 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2590 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2591 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2591 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 131381934, 401430, 100352, 0, 0 ] } , "name": "/layers.14/self_attn/o_proj/Linear", "outputIndexes": [ 2592 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2592 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2593 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2593 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.14/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1372 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1292, 1372 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_73_output_0", "outputIndexes": [ 1373 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1373 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 131883716, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_14/Mul_1_output_0", "outputIndexes": [ 1374 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1374 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2594 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2594 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2595 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2595 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 131890884, 2179094, 544768, 0, 0 ] } , "name": "/layers.14/mlp/gate_proj/Linear", "outputIndexes": [ 2596 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2596 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2597 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2597 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1375 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1375 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_14/Mul_output_0", "outputIndexes": [ 1376 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2595 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 134614746, 2179094, 544768, 0, 0 ] } , "name": "/layers.14/mlp/up_proj/Linear", "outputIndexes": [ 2600 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2600 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2601 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2601 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1377 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1376, 1377 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_14/Mul_output_0", "outputIndexes": [ 1378 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1378 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2602 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2602 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.14/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2603 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2603 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 137338608, 2179094, 544768, 0, 0 ] } , "name": "/layers.14/mlp/down_proj/Linear", "outputIndexes": [ 2604 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2604 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2605 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2605 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.14/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1379 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1373, 1379 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_74_output_0", "outputIndexes": [ 1380 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1380, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_135_output_0", "outputIndexes": [ 1381 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1381 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 140062470, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_15/Mul_1_output_0", "outputIndexes": [ 1382 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2606 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2606 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2607 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 140069638, 401430, 100352, 3584, 0 ] } , "name": "/layers.15/self_attn/q_proj/Linear", "outputIndexes": [ 2608 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2608 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2609 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2609 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1383 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1382 ] , "main_type": "NONE", "name": "/Shape_210_output_0", "outputIndexes": [ 1384 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1384 ] , "main_type": "NONE", "name": "Shape5674", "outputIndexes": [ 1385 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1384 ] , "main_type": "NONE", "name": "Rank5676", "outputIndexes": [ 1386 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1386, 1386 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5678", "outputIndexes": [ 1387 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5679", "outputIndexes": [ 1388 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5681", "outputIndexes": [ 1389 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5682", "outputIndexes": [ 1390 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385, 1388, 1390, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5685", "outputIndexes": [ 1391 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1391 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5686", "outputIndexes": [ 1392 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1392, 1392 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5688", "outputIndexes": [ 1393 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384, 1393, 1387 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_228_output_0", "outputIndexes": [ 1394 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_480_output_0", "outputIndexes": [ 1395 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1387 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5696", "outputIndexes": [ 1396 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1389 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5699", "outputIndexes": [ 1397 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1385, 1396, 1397, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5702", "outputIndexes": [ 1398 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1398 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5703", "outputIndexes": [ 1399 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1399 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5704", "outputIndexes": [ 1400 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1400, 1399 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5705", "outputIndexes": [ 1401 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1384, 1401, 1387 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_229_output_0", "outputIndexes": [ 1402 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_481_output_0", "outputIndexes": [ 1403 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1395, 1403, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_195_output_0", "outputIndexes": [ 1404 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1383, 1404 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_136_output_0", "outputIndexes": [ 1405 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_120_output_0", "outputIndexes": [ 1406 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405 ] , "main_type": "NONE", "name": "/Shape_212_output_0", "outputIndexes": [ 1407 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1407 ] , "main_type": "NONE", "name": "Shape5806", "outputIndexes": [ 1408 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1407 ] , "main_type": "NONE", "name": "Rank5808", "outputIndexes": [ 1409 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1409, 1409 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5810", "outputIndexes": [ 1410 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5811", "outputIndexes": [ 1411 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1410, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5813", "outputIndexes": [ 1412 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1412 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5814", "outputIndexes": [ 1413 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1408, 1411, 1413, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5817", "outputIndexes": [ 1414 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1414 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5818", "outputIndexes": [ 1415 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1415 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5819", "outputIndexes": [ 1416 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1416, 1415 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5820", "outputIndexes": [ 1417 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1407, 1417, 1410 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_230_output_0", "outputIndexes": [ 1418 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1418, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_45_output_0", "outputIndexes": [ 1419 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_487_output_0", "outputIndexes": [ 1420 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 1420, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_61_output_0", "outputIndexes": [ 1421 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1421 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_30_output_0", "outputIndexes": [ 1422 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1419, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_486_output_0", "outputIndexes": [ 1423 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1405, 20, 1423, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_60_output_0", "outputIndexes": [ 1424 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1422, 1424 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_198_output_0", "outputIndexes": [ 1425 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1425, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_121_output_0", "outputIndexes": [ 1426 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1406, 1426 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_75_output_0", "outputIndexes": [ 1427 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 140575004, 57366, 14336, 512, 0 ] } , "name": "/layers.15/self_attn/k_proj/Linear", "outputIndexes": [ 2612 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2612 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2613 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2613 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1428 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_482_output_0", "outputIndexes": [ 1429 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_483_output_0", "outputIndexes": [ 1430 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1429, 1430, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_196_output_0", "outputIndexes": [ 1431 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1428, 1431 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_137_output_0", "outputIndexes": [ 1432 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_122_output_0", "outputIndexes": [ 1433 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432 ] , "main_type": "NONE", "name": "/Shape_213_output_0", "outputIndexes": [ 1434 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1434 ] , "main_type": "NONE", "name": "Shape5712", "outputIndexes": [ 1435 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1434 ] , "main_type": "NONE", "name": "Rank5714", "outputIndexes": [ 1436 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1436, 1436 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5716", "outputIndexes": [ 1437 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1437 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5717", "outputIndexes": [ 1438 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1437, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5719", "outputIndexes": [ 1439 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1439 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze5720", "outputIndexes": [ 1440 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1435, 1438, 1440, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice5723", "outputIndexes": [ 1441 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1441 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze5724", "outputIndexes": [ 1442 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1442 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5725", "outputIndexes": [ 1443 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1443, 1442 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp5726", "outputIndexes": [ 1444 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1434, 1444, 1437 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_231_output_0", "outputIndexes": [ 1445 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1445, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_46_output_0", "outputIndexes": [ 1446 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1446, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_489_output_0", "outputIndexes": [ 1447 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432, 1447, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_63_output_0", "outputIndexes": [ 1448 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1448 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_31_output_0", "outputIndexes": [ 1449 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1446, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_488_output_0", "outputIndexes": [ 1450 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1432, 20, 1450, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_62_output_0", "outputIndexes": [ 1451 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1449, 1451 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_199_output_0", "outputIndexes": [ 1452 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1452, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_123_output_0", "outputIndexes": [ 1453 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1433, 1453 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_76_output_0", "outputIndexes": [ 1454 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2607 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 140647218, 57366, 14336, 512, 0 ] } , "name": "/layers.15/self_attn/v_proj/Linear", "outputIndexes": [ 2616 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2616 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2617 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2617 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1455 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1394, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_484_output_0", "outputIndexes": [ 1456 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1402, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_485_output_0", "outputIndexes": [ 1457 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1456, 1457, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_197_output_0", "outputIndexes": [ 1458 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1455, 1458 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_138_output_0", "outputIndexes": [ 1459 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1427, 1454, 1459, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_143_output_0", "outputIndexes": [ 1460 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1460 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2618 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2618 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2619 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2619 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 140719432, 401430, 100352, 0, 0 ] } , "name": "/layers.15/self_attn/o_proj/Linear", "outputIndexes": [ 2620 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2620 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2621 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2621 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.15/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1461 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1381, 1461 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_78_output_0", "outputIndexes": [ 1462 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 141221214, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_15/Mul_1_output_0", "outputIndexes": [ 1463 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1463 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2622 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2622 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2623 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2623 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 141228382, 2179094, 544768, 0, 0 ] } , "name": "/layers.15/mlp/gate_proj/Linear", "outputIndexes": [ 2624 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2624 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2625 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2625 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1464 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1464 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_15/Mul_output_0", "outputIndexes": [ 1465 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2623 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 143952244, 2179094, 544768, 0, 0 ] } , "name": "/layers.15/mlp/up_proj/Linear", "outputIndexes": [ 2628 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2628 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2629 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2629 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1466 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1465, 1466 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_15/Mul_output_0", "outputIndexes": [ 1467 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1467 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2630 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2630 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.15/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2631 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2631 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 146676106, 2179094, 544768, 0, 0 ] } , "name": "/layers.15/mlp/down_proj/Linear", "outputIndexes": [ 2632 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2632 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2633 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2633 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.15/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1468 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1462, 1468 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_79_output_0", "outputIndexes": [ 1469 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1469, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_144_output_0", "outputIndexes": [ 1470 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1470 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 149399968, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_16/Mul_1_output_0", "outputIndexes": [ 1471 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2634 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2634 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2635 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 149407136, 401430, 100352, 3584, 0 ] } , "name": "/layers.16/self_attn/q_proj/Linear", "outputIndexes": [ 2636 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2636 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2637 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2637 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1472 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1471 ] , "main_type": "NONE", "name": "/Shape_224_output_0", "outputIndexes": [ 1473 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1473 ] , "main_type": "NONE", "name": "Shape6045", "outputIndexes": [ 1474 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1473 ] , "main_type": "NONE", "name": "Rank6047", "outputIndexes": [ 1475 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1475, 1475 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6049", "outputIndexes": [ 1476 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6050", "outputIndexes": [ 1477 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6052", "outputIndexes": [ 1478 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6053", "outputIndexes": [ 1479 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1474, 1477, 1479, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6056", "outputIndexes": [ 1480 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1480 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6057", "outputIndexes": [ 1481 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1481, 1481 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6059", "outputIndexes": [ 1482 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473, 1482, 1476 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_243_output_0", "outputIndexes": [ 1483 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_512_output_0", "outputIndexes": [ 1484 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1476 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6067", "outputIndexes": [ 1485 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1478 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6070", "outputIndexes": [ 1486 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1474, 1485, 1486, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6073", "outputIndexes": [ 1487 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1487 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6074", "outputIndexes": [ 1488 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1488 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6075", "outputIndexes": [ 1489 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1489, 1488 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6076", "outputIndexes": [ 1490 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1473, 1490, 1476 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_244_output_0", "outputIndexes": [ 1491 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_513_output_0", "outputIndexes": [ 1492 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1484, 1492, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_208_output_0", "outputIndexes": [ 1493 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1472, 1493 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_145_output_0", "outputIndexes": [ 1494 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_128_output_0", "outputIndexes": [ 1495 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494 ] , "main_type": "NONE", "name": "/Shape_226_output_0", "outputIndexes": [ 1496 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1496 ] , "main_type": "NONE", "name": "Shape6177", "outputIndexes": [ 1497 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1496 ] , "main_type": "NONE", "name": "Rank6179", "outputIndexes": [ 1498 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1498, 1498 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6181", "outputIndexes": [ 1499 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6182", "outputIndexes": [ 1500 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1499, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6184", "outputIndexes": [ 1501 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1501 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6185", "outputIndexes": [ 1502 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1497, 1500, 1502, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6188", "outputIndexes": [ 1503 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1503 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6189", "outputIndexes": [ 1504 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1504 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6190", "outputIndexes": [ 1505 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1505, 1504 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6191", "outputIndexes": [ 1506 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1496, 1506, 1499 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_245_output_0", "outputIndexes": [ 1507 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1507, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_48_output_0", "outputIndexes": [ 1508 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1508, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_519_output_0", "outputIndexes": [ 1509 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 1509, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_65_output_0", "outputIndexes": [ 1510 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1510 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_32_output_0", "outputIndexes": [ 1511 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1508, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_518_output_0", "outputIndexes": [ 1512 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1494, 20, 1512, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_64_output_0", "outputIndexes": [ 1513 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1511, 1513 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_211_output_0", "outputIndexes": [ 1514 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1514, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_129_output_0", "outputIndexes": [ 1515 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1495, 1515 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_80_output_0", "outputIndexes": [ 1516 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 149912502, 57366, 14336, 512, 0 ] } , "name": "/layers.16/self_attn/k_proj/Linear", "outputIndexes": [ 2640 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2640 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2641 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2641 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1517 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_514_output_0", "outputIndexes": [ 1518 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_515_output_0", "outputIndexes": [ 1519 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1518, 1519, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_209_output_0", "outputIndexes": [ 1520 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1517, 1520 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_146_output_0", "outputIndexes": [ 1521 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_130_output_0", "outputIndexes": [ 1522 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521 ] , "main_type": "NONE", "name": "/Shape_227_output_0", "outputIndexes": [ 1523 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1523 ] , "main_type": "NONE", "name": "Shape6083", "outputIndexes": [ 1524 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1523 ] , "main_type": "NONE", "name": "Rank6085", "outputIndexes": [ 1525 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1525, 1525 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6087", "outputIndexes": [ 1526 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6088", "outputIndexes": [ 1527 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1526, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6090", "outputIndexes": [ 1528 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1528 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6091", "outputIndexes": [ 1529 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1524, 1527, 1529, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6094", "outputIndexes": [ 1530 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1530 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6095", "outputIndexes": [ 1531 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1531 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6096", "outputIndexes": [ 1532 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1532, 1531 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6097", "outputIndexes": [ 1533 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1523, 1533, 1526 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_246_output_0", "outputIndexes": [ 1534 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1534, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_49_output_0", "outputIndexes": [ 1535 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_521_output_0", "outputIndexes": [ 1536 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 1536, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_67_output_0", "outputIndexes": [ 1537 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1537 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_33_output_0", "outputIndexes": [ 1538 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1535, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_520_output_0", "outputIndexes": [ 1539 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1521, 20, 1539, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_66_output_0", "outputIndexes": [ 1540 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1538, 1540 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_212_output_0", "outputIndexes": [ 1541 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1541, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_131_output_0", "outputIndexes": [ 1542 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1522, 1542 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_81_output_0", "outputIndexes": [ 1543 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2635 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 149984716, 57366, 14336, 512, 0 ] } , "name": "/layers.16/self_attn/v_proj/Linear", "outputIndexes": [ 2644 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2644 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2645 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2645 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1544 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1483, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_516_output_0", "outputIndexes": [ 1545 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1491, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_517_output_0", "outputIndexes": [ 1546 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1545, 1546, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_210_output_0", "outputIndexes": [ 1547 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1544, 1547 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_147_output_0", "outputIndexes": [ 1548 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1516, 1543, 1548, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_152_output_0", "outputIndexes": [ 1549 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1549 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2646 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2646 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2647 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2647 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 150056930, 401430, 100352, 0, 0 ] } , "name": "/layers.16/self_attn/o_proj/Linear", "outputIndexes": [ 2648 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2648 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2649 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2649 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.16/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1550 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1470, 1550 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_83_output_0", "outputIndexes": [ 1551 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 150558712, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_16/Mul_1_output_0", "outputIndexes": [ 1552 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1552 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2650 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2650 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2651 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 150565880, 2179094, 544768, 0, 0 ] } , "name": "/layers.16/mlp/gate_proj/Linear", "outputIndexes": [ 2652 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2652 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2653 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2653 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1553 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1553 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_16/Mul_output_0", "outputIndexes": [ 1554 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2651 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 153289742, 2179094, 544768, 0, 0 ] } , "name": "/layers.16/mlp/up_proj/Linear", "outputIndexes": [ 2656 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2656 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2657 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2657 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1555 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1554, 1555 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_16/Mul_output_0", "outputIndexes": [ 1556 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1556 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2658 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2658 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.16/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2659 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2659 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 156013604, 2179094, 544768, 0, 0 ] } , "name": "/layers.16/mlp/down_proj/Linear", "outputIndexes": [ 2660 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2660 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2661 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2661 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.16/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1557 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1551, 1557 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_84_output_0", "outputIndexes": [ 1558 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1558, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_153_output_0", "outputIndexes": [ 1559 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1559 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 158737466, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_17/Mul_1_output_0", "outputIndexes": [ 1560 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2662 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2662 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2663 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2663 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 158744634, 401430, 100352, 3584, 0 ] } , "name": "/layers.17/self_attn/q_proj/Linear", "outputIndexes": [ 2664 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2664 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2665 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2665 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1561 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1560 ] , "main_type": "NONE", "name": "/Shape_238_output_0", "outputIndexes": [ 1562 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "Shape6416", "outputIndexes": [ 1563 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1562 ] , "main_type": "NONE", "name": "Rank6418", "outputIndexes": [ 1564 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1564, 1564 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6420", "outputIndexes": [ 1565 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6421", "outputIndexes": [ 1566 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6423", "outputIndexes": [ 1567 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6424", "outputIndexes": [ 1568 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1563, 1566, 1568, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6427", "outputIndexes": [ 1569 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1569 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6428", "outputIndexes": [ 1570 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1570, 1570 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6430", "outputIndexes": [ 1571 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562, 1571, 1565 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_258_output_0", "outputIndexes": [ 1572 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_544_output_0", "outputIndexes": [ 1573 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1565 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6438", "outputIndexes": [ 1574 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1567 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6441", "outputIndexes": [ 1575 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1563, 1574, 1575, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6444", "outputIndexes": [ 1576 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1576 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6445", "outputIndexes": [ 1577 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1577 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6446", "outputIndexes": [ 1578 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1578, 1577 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6447", "outputIndexes": [ 1579 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1562, 1579, 1565 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_259_output_0", "outputIndexes": [ 1580 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_545_output_0", "outputIndexes": [ 1581 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1573, 1581, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_221_output_0", "outputIndexes": [ 1582 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1561, 1582 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_154_output_0", "outputIndexes": [ 1583 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_136_output_0", "outputIndexes": [ 1584 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583 ] , "main_type": "NONE", "name": "/Shape_240_output_0", "outputIndexes": [ 1585 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1585 ] , "main_type": "NONE", "name": "Shape6548", "outputIndexes": [ 1586 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1585 ] , "main_type": "NONE", "name": "Rank6550", "outputIndexes": [ 1587 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1587, 1587 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6552", "outputIndexes": [ 1588 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1588 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6553", "outputIndexes": [ 1589 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1588, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6555", "outputIndexes": [ 1590 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1590 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6556", "outputIndexes": [ 1591 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1586, 1589, 1591, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6559", "outputIndexes": [ 1592 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1592 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6560", "outputIndexes": [ 1593 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1593 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6561", "outputIndexes": [ 1594 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1594, 1593 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6562", "outputIndexes": [ 1595 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1585, 1595, 1588 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_260_output_0", "outputIndexes": [ 1596 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1596, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_51_output_0", "outputIndexes": [ 1597 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1597, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_551_output_0", "outputIndexes": [ 1598 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 1598, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_69_output_0", "outputIndexes": [ 1599 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1599 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_34_output_0", "outputIndexes": [ 1600 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1597, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_550_output_0", "outputIndexes": [ 1601 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1583, 20, 1601, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_68_output_0", "outputIndexes": [ 1602 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1600, 1602 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_224_output_0", "outputIndexes": [ 1603 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1603, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_137_output_0", "outputIndexes": [ 1604 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1584, 1604 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_85_output_0", "outputIndexes": [ 1605 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2663 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 159250000, 57366, 14336, 512, 0 ] } , "name": "/layers.17/self_attn/k_proj/Linear", "outputIndexes": [ 2668 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2668 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2669 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2669 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1606 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_546_output_0", "outputIndexes": [ 1607 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_547_output_0", "outputIndexes": [ 1608 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1607, 1608, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_222_output_0", "outputIndexes": [ 1609 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1606, 1609 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_155_output_0", "outputIndexes": [ 1610 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_138_output_0", "outputIndexes": [ 1611 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610 ] , "main_type": "NONE", "name": "/Shape_241_output_0", "outputIndexes": [ 1612 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1612 ] , "main_type": "NONE", "name": "Shape6454", "outputIndexes": [ 1613 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1612 ] , "main_type": "NONE", "name": "Rank6456", "outputIndexes": [ 1614 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1614, 1614 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6458", "outputIndexes": [ 1615 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1615 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6459", "outputIndexes": [ 1616 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1615, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6461", "outputIndexes": [ 1617 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1617 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6462", "outputIndexes": [ 1618 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1613, 1616, 1618, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6465", "outputIndexes": [ 1619 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1619 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6466", "outputIndexes": [ 1620 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1620 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6467", "outputIndexes": [ 1621 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1621, 1620 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6468", "outputIndexes": [ 1622 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1612, 1622, 1615 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_261_output_0", "outputIndexes": [ 1623 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1623, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_52_output_0", "outputIndexes": [ 1624 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_553_output_0", "outputIndexes": [ 1625 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610, 1625, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_71_output_0", "outputIndexes": [ 1626 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1626 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_35_output_0", "outputIndexes": [ 1627 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1624, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_552_output_0", "outputIndexes": [ 1628 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1610, 20, 1628, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_70_output_0", "outputIndexes": [ 1629 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1627, 1629 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_225_output_0", "outputIndexes": [ 1630 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1630, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_139_output_0", "outputIndexes": [ 1631 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1611, 1631 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_86_output_0", "outputIndexes": [ 1632 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2663 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 159322214, 57366, 14336, 512, 0 ] } , "name": "/layers.17/self_attn/v_proj/Linear", "outputIndexes": [ 2672 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2672 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2673 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2673 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1633 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1572, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_548_output_0", "outputIndexes": [ 1634 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1580, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_549_output_0", "outputIndexes": [ 1635 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1634, 1635, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_223_output_0", "outputIndexes": [ 1636 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1633, 1636 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_156_output_0", "outputIndexes": [ 1637 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1605, 1632, 1637, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_161_output_0", "outputIndexes": [ 1638 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1638 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2674 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2674 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2675 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2675 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 159394428, 401430, 100352, 0, 0 ] } , "name": "/layers.17/self_attn/o_proj/Linear", "outputIndexes": [ 2676 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2676 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2677 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2677 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.17/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1639 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1559, 1639 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_88_output_0", "outputIndexes": [ 1640 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 159896210, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_17/Mul_1_output_0", "outputIndexes": [ 1641 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1641 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2678 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2678 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2679 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2679 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 159903378, 2179094, 544768, 0, 0 ] } , "name": "/layers.17/mlp/gate_proj/Linear", "outputIndexes": [ 2680 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2680 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2681 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2681 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1642 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1642 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_17/Mul_output_0", "outputIndexes": [ 1643 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2679 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 162627240, 2179094, 544768, 0, 0 ] } , "name": "/layers.17/mlp/up_proj/Linear", "outputIndexes": [ 2684 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2684 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2685 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2685 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1644 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1643, 1644 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_17/Mul_output_0", "outputIndexes": [ 1645 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1645 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2686 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2686 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.17/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2687 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2687 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 165351102, 2179094, 544768, 0, 0 ] } , "name": "/layers.17/mlp/down_proj/Linear", "outputIndexes": [ 2688 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2688 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2689 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2689 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.17/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1646 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1640, 1646 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_89_output_0", "outputIndexes": [ 1647 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1647, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_162_output_0", "outputIndexes": [ 1648 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 168074964, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_18/Mul_1_output_0", "outputIndexes": [ 1649 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1649 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2690 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2690 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2691 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 168082132, 401430, 100352, 3584, 0 ] } , "name": "/layers.18/self_attn/q_proj/Linear", "outputIndexes": [ 2692 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2692 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2693 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2693 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1650 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1649 ] , "main_type": "NONE", "name": "/Shape_252_output_0", "outputIndexes": [ 1651 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1651 ] , "main_type": "NONE", "name": "Shape6787", "outputIndexes": [ 1652 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1651 ] , "main_type": "NONE", "name": "Rank6789", "outputIndexes": [ 1653 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1653, 1653 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6791", "outputIndexes": [ 1654 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6792", "outputIndexes": [ 1655 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6794", "outputIndexes": [ 1656 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6795", "outputIndexes": [ 1657 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1652, 1655, 1657, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6798", "outputIndexes": [ 1658 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1658 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6799", "outputIndexes": [ 1659 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1659, 1659 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6801", "outputIndexes": [ 1660 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651, 1660, 1654 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_273_output_0", "outputIndexes": [ 1661 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_576_output_0", "outputIndexes": [ 1662 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1654 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6809", "outputIndexes": [ 1663 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1656 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6812", "outputIndexes": [ 1664 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1652, 1663, 1664, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6815", "outputIndexes": [ 1665 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1665 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6816", "outputIndexes": [ 1666 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1666 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6817", "outputIndexes": [ 1667 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1667, 1666 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6818", "outputIndexes": [ 1668 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1651, 1668, 1654 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_274_output_0", "outputIndexes": [ 1669 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_577_output_0", "outputIndexes": [ 1670 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1662, 1670, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_234_output_0", "outputIndexes": [ 1671 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1650, 1671 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_163_output_0", "outputIndexes": [ 1672 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_144_output_0", "outputIndexes": [ 1673 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672 ] , "main_type": "NONE", "name": "/Shape_254_output_0", "outputIndexes": [ 1674 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1674 ] , "main_type": "NONE", "name": "Shape6919", "outputIndexes": [ 1675 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1674 ] , "main_type": "NONE", "name": "Rank6921", "outputIndexes": [ 1676 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1676, 1676 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6923", "outputIndexes": [ 1677 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1677 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6924", "outputIndexes": [ 1678 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1677, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6926", "outputIndexes": [ 1679 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1679 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6927", "outputIndexes": [ 1680 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1675, 1678, 1680, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6930", "outputIndexes": [ 1681 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1681 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6931", "outputIndexes": [ 1682 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1682 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6932", "outputIndexes": [ 1683 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1683, 1682 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6933", "outputIndexes": [ 1684 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1674, 1684, 1677 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_275_output_0", "outputIndexes": [ 1685 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1685, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_54_output_0", "outputIndexes": [ 1686 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_583_output_0", "outputIndexes": [ 1687 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 1687, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_73_output_0", "outputIndexes": [ 1688 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1688 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_36_output_0", "outputIndexes": [ 1689 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1686, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_582_output_0", "outputIndexes": [ 1690 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1672, 20, 1690, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_72_output_0", "outputIndexes": [ 1691 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1689, 1691 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_237_output_0", "outputIndexes": [ 1692 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1692, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_145_output_0", "outputIndexes": [ 1693 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1673, 1693 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_90_output_0", "outputIndexes": [ 1694 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 168587498, 57366, 14336, 512, 0 ] } , "name": "/layers.18/self_attn/k_proj/Linear", "outputIndexes": [ 2696 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2696 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2697 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2697 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1695 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_578_output_0", "outputIndexes": [ 1696 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_579_output_0", "outputIndexes": [ 1697 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1696, 1697, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_235_output_0", "outputIndexes": [ 1698 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1695, 1698 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_164_output_0", "outputIndexes": [ 1699 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_146_output_0", "outputIndexes": [ 1700 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699 ] , "main_type": "NONE", "name": "/Shape_255_output_0", "outputIndexes": [ 1701 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1701 ] , "main_type": "NONE", "name": "Shape6825", "outputIndexes": [ 1702 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1701 ] , "main_type": "NONE", "name": "Rank6827", "outputIndexes": [ 1703 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1703, 1703 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6829", "outputIndexes": [ 1704 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1704 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6830", "outputIndexes": [ 1705 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1704, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6832", "outputIndexes": [ 1706 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1706 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze6833", "outputIndexes": [ 1707 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1702, 1705, 1707, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice6836", "outputIndexes": [ 1708 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1708 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze6837", "outputIndexes": [ 1709 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1709 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6838", "outputIndexes": [ 1710 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1710, 1709 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp6839", "outputIndexes": [ 1711 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1701, 1711, 1704 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_276_output_0", "outputIndexes": [ 1712 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1712, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_55_output_0", "outputIndexes": [ 1713 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1713, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_585_output_0", "outputIndexes": [ 1714 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 1714, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_75_output_0", "outputIndexes": [ 1715 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1715 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_37_output_0", "outputIndexes": [ 1716 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1713, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_584_output_0", "outputIndexes": [ 1717 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1699, 20, 1717, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_74_output_0", "outputIndexes": [ 1718 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1716, 1718 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_238_output_0", "outputIndexes": [ 1719 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1719, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_147_output_0", "outputIndexes": [ 1720 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1700, 1720 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_91_output_0", "outputIndexes": [ 1721 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2691 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 168659712, 57366, 14336, 512, 0 ] } , "name": "/layers.18/self_attn/v_proj/Linear", "outputIndexes": [ 2700 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2700 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2701 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2701 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1722 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1661, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_580_output_0", "outputIndexes": [ 1723 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1669, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_581_output_0", "outputIndexes": [ 1724 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1723, 1724, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_236_output_0", "outputIndexes": [ 1725 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1722, 1725 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_165_output_0", "outputIndexes": [ 1726 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1694, 1721, 1726, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_170_output_0", "outputIndexes": [ 1727 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1727 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2702 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2702 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2703 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2703 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 168731926, 401430, 100352, 0, 0 ] } , "name": "/layers.18/self_attn/o_proj/Linear", "outputIndexes": [ 2704 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2704 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2705 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2705 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.18/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1728 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1648, 1728 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_93_output_0", "outputIndexes": [ 1729 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1729 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 169233708, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_18/Mul_1_output_0", "outputIndexes": [ 1730 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1730 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2706 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2706 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2707 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2707 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 169240876, 2179094, 544768, 0, 0 ] } , "name": "/layers.18/mlp/gate_proj/Linear", "outputIndexes": [ 2708 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2708 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2709 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2709 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1731 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1731 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_18/Mul_output_0", "outputIndexes": [ 1732 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2707 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 171964738, 2179094, 544768, 0, 0 ] } , "name": "/layers.18/mlp/up_proj/Linear", "outputIndexes": [ 2712 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2712 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2713 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2713 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1733 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1732, 1733 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_18/Mul_output_0", "outputIndexes": [ 1734 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1734 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2714 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2714 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.18/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2715 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2715 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 174688600, 2179094, 544768, 0, 0 ] } , "name": "/layers.18/mlp/down_proj/Linear", "outputIndexes": [ 2716 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2716 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2717 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2717 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.18/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1735 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1729, 1735 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_94_output_0", "outputIndexes": [ 1736 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1736, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_171_output_0", "outputIndexes": [ 1737 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 177412462, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_19/Mul_1_output_0", "outputIndexes": [ 1738 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1738 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2718 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2718 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2719 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 177419630, 401430, 100352, 3584, 0 ] } , "name": "/layers.19/self_attn/q_proj/Linear", "outputIndexes": [ 2720 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2720 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2721 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2721 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1739 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1738 ] , "main_type": "NONE", "name": "/Shape_266_output_0", "outputIndexes": [ 1740 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1740 ] , "main_type": "NONE", "name": "Shape7158", "outputIndexes": [ 1741 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1740 ] , "main_type": "NONE", "name": "Rank7160", "outputIndexes": [ 1742 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1742, 1742 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7162", "outputIndexes": [ 1743 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7163", "outputIndexes": [ 1744 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7165", "outputIndexes": [ 1745 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7166", "outputIndexes": [ 1746 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 1744, 1746, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7169", "outputIndexes": [ 1747 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1747 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7170", "outputIndexes": [ 1748 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1748, 1748 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7172", "outputIndexes": [ 1749 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1740, 1749, 1743 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_288_output_0", "outputIndexes": [ 1750 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_608_output_0", "outputIndexes": [ 1751 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1743 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7180", "outputIndexes": [ 1752 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1745 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7183", "outputIndexes": [ 1753 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1741, 1752, 1753, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7186", "outputIndexes": [ 1754 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1754 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7187", "outputIndexes": [ 1755 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1755 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7188", "outputIndexes": [ 1756 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1756, 1755 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7189", "outputIndexes": [ 1757 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1740, 1757, 1743 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_289_output_0", "outputIndexes": [ 1758 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_609_output_0", "outputIndexes": [ 1759 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1751, 1759, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_247_output_0", "outputIndexes": [ 1760 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1739, 1760 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_172_output_0", "outputIndexes": [ 1761 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_152_output_0", "outputIndexes": [ 1762 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761 ] , "main_type": "NONE", "name": "/Shape_268_output_0", "outputIndexes": [ 1763 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1763 ] , "main_type": "NONE", "name": "Shape7290", "outputIndexes": [ 1764 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1763 ] , "main_type": "NONE", "name": "Rank7292", "outputIndexes": [ 1765 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1765, 1765 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7294", "outputIndexes": [ 1766 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7295", "outputIndexes": [ 1767 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1766, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7297", "outputIndexes": [ 1768 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1768 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7298", "outputIndexes": [ 1769 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1764, 1767, 1769, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7301", "outputIndexes": [ 1770 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1770 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7302", "outputIndexes": [ 1771 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1771 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7303", "outputIndexes": [ 1772 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1772, 1771 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7304", "outputIndexes": [ 1773 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1763, 1773, 1766 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_290_output_0", "outputIndexes": [ 1774 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1774, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_57_output_0", "outputIndexes": [ 1775 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_615_output_0", "outputIndexes": [ 1776 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 1776, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_77_output_0", "outputIndexes": [ 1777 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1777 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_38_output_0", "outputIndexes": [ 1778 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1775, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_614_output_0", "outputIndexes": [ 1779 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1761, 20, 1779, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_76_output_0", "outputIndexes": [ 1780 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1778, 1780 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_250_output_0", "outputIndexes": [ 1781 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1781, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_153_output_0", "outputIndexes": [ 1782 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1762, 1782 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_95_output_0", "outputIndexes": [ 1783 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 177924996, 57366, 14336, 512, 0 ] } , "name": "/layers.19/self_attn/k_proj/Linear", "outputIndexes": [ 2724 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2724 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2725 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2725 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1784 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_610_output_0", "outputIndexes": [ 1785 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_611_output_0", "outputIndexes": [ 1786 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1785, 1786, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_248_output_0", "outputIndexes": [ 1787 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1784, 1787 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_173_output_0", "outputIndexes": [ 1788 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_154_output_0", "outputIndexes": [ 1789 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788 ] , "main_type": "NONE", "name": "/Shape_269_output_0", "outputIndexes": [ 1790 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1790 ] , "main_type": "NONE", "name": "Shape7196", "outputIndexes": [ 1791 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1790 ] , "main_type": "NONE", "name": "Rank7198", "outputIndexes": [ 1792 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1792, 1792 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7200", "outputIndexes": [ 1793 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1793 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7201", "outputIndexes": [ 1794 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1793, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7203", "outputIndexes": [ 1795 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1795 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7204", "outputIndexes": [ 1796 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1791, 1794, 1796, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7207", "outputIndexes": [ 1797 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1797 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7208", "outputIndexes": [ 1798 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1798 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7209", "outputIndexes": [ 1799 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1799, 1798 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7210", "outputIndexes": [ 1800 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1790, 1800, 1793 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_291_output_0", "outputIndexes": [ 1801 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1801, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_58_output_0", "outputIndexes": [ 1802 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1802, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_617_output_0", "outputIndexes": [ 1803 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 1803, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_79_output_0", "outputIndexes": [ 1804 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1804 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_39_output_0", "outputIndexes": [ 1805 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1802, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_616_output_0", "outputIndexes": [ 1806 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1788, 20, 1806, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_78_output_0", "outputIndexes": [ 1807 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1805, 1807 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_251_output_0", "outputIndexes": [ 1808 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1808, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_155_output_0", "outputIndexes": [ 1809 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1789, 1809 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_96_output_0", "outputIndexes": [ 1810 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2719 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 177997210, 57366, 14336, 512, 0 ] } , "name": "/layers.19/self_attn/v_proj/Linear", "outputIndexes": [ 2728 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2728 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2729 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2729 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1811 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1750, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_612_output_0", "outputIndexes": [ 1812 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1758, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_613_output_0", "outputIndexes": [ 1813 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1812, 1813, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_249_output_0", "outputIndexes": [ 1814 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1811, 1814 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_174_output_0", "outputIndexes": [ 1815 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1783, 1810, 1815, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_179_output_0", "outputIndexes": [ 1816 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1816 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2730 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2730 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2731 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2731 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 178069424, 401430, 100352, 0, 0 ] } , "name": "/layers.19/self_attn/o_proj/Linear", "outputIndexes": [ 2732 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2732 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2733 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2733 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.19/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1817 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1737, 1817 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_98_output_0", "outputIndexes": [ 1818 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 178571206, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_19/Mul_1_output_0", "outputIndexes": [ 1819 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1819 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2734 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2734 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2735 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 178578374, 2179094, 544768, 0, 0 ] } , "name": "/layers.19/mlp/gate_proj/Linear", "outputIndexes": [ 2736 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2736 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2737 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2737 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1820 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1820 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_19/Mul_output_0", "outputIndexes": [ 1821 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2735 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 181302236, 2179094, 544768, 0, 0 ] } , "name": "/layers.19/mlp/up_proj/Linear", "outputIndexes": [ 2740 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2740 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2741 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2741 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1822 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1821, 1822 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_19/Mul_output_0", "outputIndexes": [ 1823 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1823 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2742 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2742 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.19/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2743 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2743 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 184026098, 2179094, 544768, 0, 0 ] } , "name": "/layers.19/mlp/down_proj/Linear", "outputIndexes": [ 2744 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2744 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2745 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2745 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.19/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1824 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1818, 1824 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_99_output_0", "outputIndexes": [ 1825 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1825, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_180_output_0", "outputIndexes": [ 1826 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 186749960, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_20/Mul_1_output_0", "outputIndexes": [ 1827 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2746 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2746 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2747 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 186757128, 401430, 100352, 3584, 0 ] } , "name": "/layers.20/self_attn/q_proj/Linear", "outputIndexes": [ 2748 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2748 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2749 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2749 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1828 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1827 ] , "main_type": "NONE", "name": "/Shape_280_output_0", "outputIndexes": [ 1829 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1829 ] , "main_type": "NONE", "name": "Shape7529", "outputIndexes": [ 1830 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1829 ] , "main_type": "NONE", "name": "Rank7531", "outputIndexes": [ 1831 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1831, 1831 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7533", "outputIndexes": [ 1832 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7534", "outputIndexes": [ 1833 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7536", "outputIndexes": [ 1834 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7537", "outputIndexes": [ 1835 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1830, 1833, 1835, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7540", "outputIndexes": [ 1836 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1836 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7541", "outputIndexes": [ 1837 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1837, 1837 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7543", "outputIndexes": [ 1838 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829, 1838, 1832 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_303_output_0", "outputIndexes": [ 1839 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_640_output_0", "outputIndexes": [ 1840 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1832 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7551", "outputIndexes": [ 1841 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1834 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7554", "outputIndexes": [ 1842 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1830, 1841, 1842, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7557", "outputIndexes": [ 1843 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1843 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7558", "outputIndexes": [ 1844 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1844 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7559", "outputIndexes": [ 1845 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1845, 1844 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7560", "outputIndexes": [ 1846 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1829, 1846, 1832 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_304_output_0", "outputIndexes": [ 1847 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_641_output_0", "outputIndexes": [ 1848 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1840, 1848, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_260_output_0", "outputIndexes": [ 1849 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1828, 1849 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_181_output_0", "outputIndexes": [ 1850 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_160_output_0", "outputIndexes": [ 1851 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850 ] , "main_type": "NONE", "name": "/Shape_282_output_0", "outputIndexes": [ 1852 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1852 ] , "main_type": "NONE", "name": "Shape7661", "outputIndexes": [ 1853 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1852 ] , "main_type": "NONE", "name": "Rank7663", "outputIndexes": [ 1854 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1854, 1854 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7665", "outputIndexes": [ 1855 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1855 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7666", "outputIndexes": [ 1856 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1855, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7668", "outputIndexes": [ 1857 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1857 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7669", "outputIndexes": [ 1858 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1853, 1856, 1858, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7672", "outputIndexes": [ 1859 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1859 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7673", "outputIndexes": [ 1860 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1860 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7674", "outputIndexes": [ 1861 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1861, 1860 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7675", "outputIndexes": [ 1862 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1852, 1862, 1855 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_305_output_0", "outputIndexes": [ 1863 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1863, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_60_output_0", "outputIndexes": [ 1864 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1864, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_647_output_0", "outputIndexes": [ 1865 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 1865, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_81_output_0", "outputIndexes": [ 1866 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1866 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_40_output_0", "outputIndexes": [ 1867 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1864, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_646_output_0", "outputIndexes": [ 1868 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1850, 20, 1868, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_80_output_0", "outputIndexes": [ 1869 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1867, 1869 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_263_output_0", "outputIndexes": [ 1870 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1870, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_161_output_0", "outputIndexes": [ 1871 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1851, 1871 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_100_output_0", "outputIndexes": [ 1872 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 187262494, 57366, 14336, 512, 0 ] } , "name": "/layers.20/self_attn/k_proj/Linear", "outputIndexes": [ 2752 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2752 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2753 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2753 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1873 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_642_output_0", "outputIndexes": [ 1874 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_643_output_0", "outputIndexes": [ 1875 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1874, 1875, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_261_output_0", "outputIndexes": [ 1876 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1873, 1876 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_182_output_0", "outputIndexes": [ 1877 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_162_output_0", "outputIndexes": [ 1878 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877 ] , "main_type": "NONE", "name": "/Shape_283_output_0", "outputIndexes": [ 1879 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1879 ] , "main_type": "NONE", "name": "Shape7567", "outputIndexes": [ 1880 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1879 ] , "main_type": "NONE", "name": "Rank7569", "outputIndexes": [ 1881 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1881, 1881 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7571", "outputIndexes": [ 1882 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7572", "outputIndexes": [ 1883 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1882, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7574", "outputIndexes": [ 1884 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1884 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7575", "outputIndexes": [ 1885 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1880, 1883, 1885, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7578", "outputIndexes": [ 1886 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1886 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7579", "outputIndexes": [ 1887 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1887 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7580", "outputIndexes": [ 1888 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1888, 1887 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7581", "outputIndexes": [ 1889 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1879, 1889, 1882 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_306_output_0", "outputIndexes": [ 1890 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1890, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_61_output_0", "outputIndexes": [ 1891 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_649_output_0", "outputIndexes": [ 1892 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 1892, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_83_output_0", "outputIndexes": [ 1893 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1893 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_41_output_0", "outputIndexes": [ 1894 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1891, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_648_output_0", "outputIndexes": [ 1895 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1877, 20, 1895, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_82_output_0", "outputIndexes": [ 1896 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1894, 1896 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_264_output_0", "outputIndexes": [ 1897 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1897, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_163_output_0", "outputIndexes": [ 1898 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1878, 1898 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_101_output_0", "outputIndexes": [ 1899 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2747 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 187334708, 57366, 14336, 512, 0 ] } , "name": "/layers.20/self_attn/v_proj/Linear", "outputIndexes": [ 2756 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2756 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2757 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2757 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1900 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1839, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_644_output_0", "outputIndexes": [ 1901 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1847, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_645_output_0", "outputIndexes": [ 1902 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1901, 1902, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_262_output_0", "outputIndexes": [ 1903 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1900, 1903 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_183_output_0", "outputIndexes": [ 1904 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1872, 1899, 1904, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_188_output_0", "outputIndexes": [ 1905 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1905 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2758 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2758 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2759 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2759 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 187406922, 401430, 100352, 0, 0 ] } , "name": "/layers.20/self_attn/o_proj/Linear", "outputIndexes": [ 2760 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2760 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2761 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2761 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.20/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1906 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1826, 1906 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_103_output_0", "outputIndexes": [ 1907 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 187908704, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_20/Mul_1_output_0", "outputIndexes": [ 1908 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1908 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2762 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2762 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2763 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2763 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 187915872, 2179094, 544768, 0, 0 ] } , "name": "/layers.20/mlp/gate_proj/Linear", "outputIndexes": [ 2764 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2764 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2765 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2765 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1909 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1909 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_20/Mul_output_0", "outputIndexes": [ 1910 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2763 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 190639734, 2179094, 544768, 0, 0 ] } , "name": "/layers.20/mlp/up_proj/Linear", "outputIndexes": [ 2768 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2768 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2769 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2769 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 1911 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1910, 1911 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_20/Mul_output_0", "outputIndexes": [ 1912 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1912 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2770 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2770 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.20/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2771 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2771 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 193363596, 2179094, 544768, 0, 0 ] } , "name": "/layers.20/mlp/down_proj/Linear", "outputIndexes": [ 2772 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2772 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2773 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2773 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.20/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 1913 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1907, 1913 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_104_output_0", "outputIndexes": [ 1914 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1914, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_189_output_0", "outputIndexes": [ 1915 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1915 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 196087458, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_21/Mul_1_output_0", "outputIndexes": [ 1916 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2774 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2774 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2775 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2775 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 196094626, 401430, 100352, 3584, 0 ] } , "name": "/layers.21/self_attn/q_proj/Linear", "outputIndexes": [ 2776 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2776 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2777 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2777 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 1917 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1916 ] , "main_type": "NONE", "name": "/Shape_294_output_0", "outputIndexes": [ 1918 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1918 ] , "main_type": "NONE", "name": "Shape7900", "outputIndexes": [ 1919 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1918 ] , "main_type": "NONE", "name": "Rank7902", "outputIndexes": [ 1920 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1920, 1920 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7904", "outputIndexes": [ 1921 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7905", "outputIndexes": [ 1922 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7907", "outputIndexes": [ 1923 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7908", "outputIndexes": [ 1924 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 1922, 1924, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7911", "outputIndexes": [ 1925 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1925 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7912", "outputIndexes": [ 1926 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1926, 1926 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7914", "outputIndexes": [ 1927 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918, 1927, 1921 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_318_output_0", "outputIndexes": [ 1928 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_672_output_0", "outputIndexes": [ 1929 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1921 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7922", "outputIndexes": [ 1930 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1923 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7925", "outputIndexes": [ 1931 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1919, 1930, 1931, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7928", "outputIndexes": [ 1932 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1932 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7929", "outputIndexes": [ 1933 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 1933 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7930", "outputIndexes": [ 1934 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1934, 1933 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7931", "outputIndexes": [ 1935 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1918, 1935, 1921 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_319_output_0", "outputIndexes": [ 1936 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_673_output_0", "outputIndexes": [ 1937 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1929, 1937, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_273_output_0", "outputIndexes": [ 1938 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1917, 1938 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_190_output_0", "outputIndexes": [ 1939 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_168_output_0", "outputIndexes": [ 1940 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939 ] , "main_type": "NONE", "name": "/Shape_296_output_0", "outputIndexes": [ 1941 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1941 ] , "main_type": "NONE", "name": "Shape8032", "outputIndexes": [ 1942 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1941 ] , "main_type": "NONE", "name": "Rank8034", "outputIndexes": [ 1943 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1943, 1943 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8036", "outputIndexes": [ 1944 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8037", "outputIndexes": [ 1945 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1944, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8039", "outputIndexes": [ 1946 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1946 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8040", "outputIndexes": [ 1947 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1942, 1945, 1947, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8043", "outputIndexes": [ 1948 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1948 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8044", "outputIndexes": [ 1949 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1949 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8045", "outputIndexes": [ 1950 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1950, 1949 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8046", "outputIndexes": [ 1951 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1941, 1951, 1944 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_320_output_0", "outputIndexes": [ 1952 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1952, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_63_output_0", "outputIndexes": [ 1953 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1953, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_679_output_0", "outputIndexes": [ 1954 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939, 1954, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_85_output_0", "outputIndexes": [ 1955 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1955 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_42_output_0", "outputIndexes": [ 1956 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1953, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_678_output_0", "outputIndexes": [ 1957 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1939, 20, 1957, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_84_output_0", "outputIndexes": [ 1958 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1956, 1958 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_276_output_0", "outputIndexes": [ 1959 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1959, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_169_output_0", "outputIndexes": [ 1960 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1940, 1960 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_105_output_0", "outputIndexes": [ 1961 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2775 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 196599992, 57366, 14336, 512, 0 ] } , "name": "/layers.21/self_attn/k_proj/Linear", "outputIndexes": [ 2780 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2780 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2781 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2781 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 1962 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_674_output_0", "outputIndexes": [ 1963 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_675_output_0", "outputIndexes": [ 1964 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1963, 1964, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_274_output_0", "outputIndexes": [ 1965 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1962, 1965 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_191_output_0", "outputIndexes": [ 1966 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_170_output_0", "outputIndexes": [ 1967 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966 ] , "main_type": "NONE", "name": "/Shape_297_output_0", "outputIndexes": [ 1968 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "Shape7938", "outputIndexes": [ 1969 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 1968 ] , "main_type": "NONE", "name": "Rank7940", "outputIndexes": [ 1970 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1970, 1970 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7942", "outputIndexes": [ 1971 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7943", "outputIndexes": [ 1972 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1971, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7945", "outputIndexes": [ 1973 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1973 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze7946", "outputIndexes": [ 1974 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1969, 1972, 1974, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice7949", "outputIndexes": [ 1975 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1975 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze7950", "outputIndexes": [ 1976 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 1976 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7951", "outputIndexes": [ 1977 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1977, 1976 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp7952", "outputIndexes": [ 1978 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1968, 1978, 1971 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_321_output_0", "outputIndexes": [ 1979 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1979, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_64_output_0", "outputIndexes": [ 1980 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1980, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_681_output_0", "outputIndexes": [ 1981 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 1981, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_87_output_0", "outputIndexes": [ 1982 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1982 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_43_output_0", "outputIndexes": [ 1983 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1980, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_680_output_0", "outputIndexes": [ 1984 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1966, 20, 1984, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_86_output_0", "outputIndexes": [ 1985 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1983, 1985 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_277_output_0", "outputIndexes": [ 1986 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1986, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_171_output_0", "outputIndexes": [ 1987 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1967, 1987 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_106_output_0", "outputIndexes": [ 1988 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2775 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 196672206, 57366, 14336, 512, 0 ] } , "name": "/layers.21/self_attn/v_proj/Linear", "outputIndexes": [ 2784 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2784 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2785 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2785 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 1989 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1928, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_676_output_0", "outputIndexes": [ 1990 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1936, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_677_output_0", "outputIndexes": [ 1991 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1990, 1991, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_275_output_0", "outputIndexes": [ 1992 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1989, 1992 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_192_output_0", "outputIndexes": [ 1993 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1961, 1988, 1993, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_197_output_0", "outputIndexes": [ 1994 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1994 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2786 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2786 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2787 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2787 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 196744420, 401430, 100352, 0, 0 ] } , "name": "/layers.21/self_attn/o_proj/Linear", "outputIndexes": [ 2788 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2788 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2789 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2789 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.21/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 1995 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1915, 1995 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_108_output_0", "outputIndexes": [ 1996 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 197246202, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_21/Mul_1_output_0", "outputIndexes": [ 1997 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1997 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2790 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2790 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2791 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2791 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 197253370, 2179094, 544768, 0, 0 ] } , "name": "/layers.21/mlp/gate_proj/Linear", "outputIndexes": [ 2792 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2792 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2793 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2793 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 1998 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1998 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_21/Mul_output_0", "outputIndexes": [ 1999 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2791 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 199977232, 2179094, 544768, 0, 0 ] } , "name": "/layers.21/mlp/up_proj/Linear", "outputIndexes": [ 2796 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2796 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2797 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2797 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2000 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1999, 2000 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_21/Mul_output_0", "outputIndexes": [ 2001 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2001 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2798 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2798 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.21/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2799 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2799 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 202701094, 2179094, 544768, 0, 0 ] } , "name": "/layers.21/mlp/down_proj/Linear", "outputIndexes": [ 2800 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2800 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2801 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2801 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.21/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2002 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 1996, 2002 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_109_output_0", "outputIndexes": [ 2003 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2003, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_198_output_0", "outputIndexes": [ 2004 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2004 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 205424956, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_22/Mul_1_output_0", "outputIndexes": [ 2005 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2802 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2802 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2803 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 205432124, 401430, 100352, 3584, 0 ] } , "name": "/layers.22/self_attn/q_proj/Linear", "outputIndexes": [ 2804 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2804 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2805 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2805 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2006 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2005 ] , "main_type": "NONE", "name": "/Shape_308_output_0", "outputIndexes": [ 2007 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2007 ] , "main_type": "NONE", "name": "Shape8271", "outputIndexes": [ 2008 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2007 ] , "main_type": "NONE", "name": "Rank8273", "outputIndexes": [ 2009 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2009, 2009 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8275", "outputIndexes": [ 2010 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8276", "outputIndexes": [ 2011 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8278", "outputIndexes": [ 2012 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8279", "outputIndexes": [ 2013 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2011, 2013, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8282", "outputIndexes": [ 2014 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2014 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8283", "outputIndexes": [ 2015 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2015, 2015 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8285", "outputIndexes": [ 2016 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007, 2016, 2010 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_333_output_0", "outputIndexes": [ 2017 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_704_output_0", "outputIndexes": [ 2018 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2010 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8293", "outputIndexes": [ 2019 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2012 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8296", "outputIndexes": [ 2020 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2008, 2019, 2020, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8299", "outputIndexes": [ 2021 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2021 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8300", "outputIndexes": [ 2022 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2022 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8301", "outputIndexes": [ 2023 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2023, 2022 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8302", "outputIndexes": [ 2024 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2007, 2024, 2010 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_334_output_0", "outputIndexes": [ 2025 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_705_output_0", "outputIndexes": [ 2026 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2018, 2026, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_286_output_0", "outputIndexes": [ 2027 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2006, 2027 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_199_output_0", "outputIndexes": [ 2028 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_176_output_0", "outputIndexes": [ 2029 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028 ] , "main_type": "NONE", "name": "/Shape_310_output_0", "outputIndexes": [ 2030 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2030 ] , "main_type": "NONE", "name": "Shape8403", "outputIndexes": [ 2031 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2030 ] , "main_type": "NONE", "name": "Rank8405", "outputIndexes": [ 2032 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2032, 2032 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8407", "outputIndexes": [ 2033 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8408", "outputIndexes": [ 2034 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2033, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8410", "outputIndexes": [ 2035 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2035 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8411", "outputIndexes": [ 2036 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2031, 2034, 2036, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8414", "outputIndexes": [ 2037 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2037 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8415", "outputIndexes": [ 2038 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 2038 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8416", "outputIndexes": [ 2039 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2039, 2038 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8417", "outputIndexes": [ 2040 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2030, 2040, 2033 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_335_output_0", "outputIndexes": [ 2041 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2041, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_66_output_0", "outputIndexes": [ 2042 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2042, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_711_output_0", "outputIndexes": [ 2043 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 2043, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_89_output_0", "outputIndexes": [ 2044 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2044 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_44_output_0", "outputIndexes": [ 2045 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2042, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_710_output_0", "outputIndexes": [ 2046 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2028, 20, 2046, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_88_output_0", "outputIndexes": [ 2047 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2045, 2047 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_289_output_0", "outputIndexes": [ 2048 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2048, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_177_output_0", "outputIndexes": [ 2049 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2029, 2049 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_110_output_0", "outputIndexes": [ 2050 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 205937490, 57366, 14336, 512, 0 ] } , "name": "/layers.22/self_attn/k_proj/Linear", "outputIndexes": [ 2808 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2808 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2809 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2809 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2051 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_706_output_0", "outputIndexes": [ 2052 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_707_output_0", "outputIndexes": [ 2053 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2052, 2053, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_287_output_0", "outputIndexes": [ 2054 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2051, 2054 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_200_output_0", "outputIndexes": [ 2055 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_178_output_0", "outputIndexes": [ 2056 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055 ] , "main_type": "NONE", "name": "/Shape_311_output_0", "outputIndexes": [ 2057 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2057 ] , "main_type": "NONE", "name": "Shape8309", "outputIndexes": [ 2058 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2057 ] , "main_type": "NONE", "name": "Rank8311", "outputIndexes": [ 2059 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2059, 2059 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8313", "outputIndexes": [ 2060 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2060 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8314", "outputIndexes": [ 2061 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2060, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8316", "outputIndexes": [ 2062 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2062 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8317", "outputIndexes": [ 2063 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2058, 2061, 2063, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8320", "outputIndexes": [ 2064 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2064 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8321", "outputIndexes": [ 2065 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 2065 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8322", "outputIndexes": [ 2066 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2066, 2065 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8323", "outputIndexes": [ 2067 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2057, 2067, 2060 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_336_output_0", "outputIndexes": [ 2068 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2068, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_67_output_0", "outputIndexes": [ 2069 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2069, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_713_output_0", "outputIndexes": [ 2070 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 2070, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_91_output_0", "outputIndexes": [ 2071 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2071 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_45_output_0", "outputIndexes": [ 2072 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2069, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_712_output_0", "outputIndexes": [ 2073 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2055, 20, 2073, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_90_output_0", "outputIndexes": [ 2074 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2072, 2074 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_290_output_0", "outputIndexes": [ 2075 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2075, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_179_output_0", "outputIndexes": [ 2076 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2056, 2076 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_111_output_0", "outputIndexes": [ 2077 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2803 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 206009704, 57366, 14336, 512, 0 ] } , "name": "/layers.22/self_attn/v_proj/Linear", "outputIndexes": [ 2812 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2812 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2813 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2813 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2078 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2017, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_708_output_0", "outputIndexes": [ 2079 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2025, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_709_output_0", "outputIndexes": [ 2080 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2079, 2080, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_288_output_0", "outputIndexes": [ 2081 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2078, 2081 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_201_output_0", "outputIndexes": [ 2082 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2050, 2077, 2082, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_206_output_0", "outputIndexes": [ 2083 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2083 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2814 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2814 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2815 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2815 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 206081918, 401430, 100352, 0, 0 ] } , "name": "/layers.22/self_attn/o_proj/Linear", "outputIndexes": [ 2816 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2816 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2817 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2817 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.22/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2084 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2004, 2084 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_113_output_0", "outputIndexes": [ 2085 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 206583700, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_22/Mul_1_output_0", "outputIndexes": [ 2086 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2086 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2818 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2818 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2819 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 206590868, 2179094, 544768, 0, 0 ] } , "name": "/layers.22/mlp/gate_proj/Linear", "outputIndexes": [ 2820 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2820 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2821 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2821 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2087 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2087 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_22/Mul_output_0", "outputIndexes": [ 2088 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2819 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 209314730, 2179094, 544768, 0, 0 ] } , "name": "/layers.22/mlp/up_proj/Linear", "outputIndexes": [ 2824 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2824 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2825 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2825 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2089 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2088, 2089 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_22/Mul_output_0", "outputIndexes": [ 2090 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2090 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2826 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2826 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.22/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2827 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2827 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 212038592, 2179094, 544768, 0, 0 ] } , "name": "/layers.22/mlp/down_proj/Linear", "outputIndexes": [ 2828 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2828 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2829 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2829 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.22/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2091 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2085, 2091 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_114_output_0", "outputIndexes": [ 2092 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2092, 3 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_207_output_0", "outputIndexes": [ 2093 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 214762454, 3584, 3584 ] , "useRMSNorm": true } , "name": "/input_layernorm_23/Mul_1_output_0", "outputIndexes": [ 2094 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_reshape", "outputIndexes": [ 2830 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2830 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/q_proj/Linear/pre_convert", "outputIndexes": [ 2831 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 214769622, 401430, 100352, 3584, 0 ] } , "name": "/layers.23/self_attn/q_proj/Linear", "outputIndexes": [ 2832 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2832 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_convert", "outputIndexes": [ 2833 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2833 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/q_proj/Linear/post_reshape", "outputIndexes": [ 2095 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2094 ] , "main_type": "NONE", "name": "/Shape_322_output_0", "outputIndexes": [ 2096 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2096 ] , "main_type": "NONE", "name": "Shape8642", "outputIndexes": [ 2097 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2096 ] , "main_type": "NONE", "name": "Rank8644", "outputIndexes": [ 2098 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2098, 2098 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8646", "outputIndexes": [ 2099 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8647", "outputIndexes": [ 2100 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8649", "outputIndexes": [ 2101 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8650", "outputIndexes": [ 2102 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 2100, 2102, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8653", "outputIndexes": [ 2103 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2103 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8654", "outputIndexes": [ 2104 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2104, 2104 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8656", "outputIndexes": [ 2105 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 2105, 2099 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_348_output_0", "outputIndexes": [ 2106 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_736_output_0", "outputIndexes": [ 2107 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2099 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8664", "outputIndexes": [ 2108 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2101 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8667", "outputIndexes": [ 2109 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2097, 2108, 2109, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8670", "outputIndexes": [ 2110 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2110 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8671", "outputIndexes": [ 2111 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 12, 2111 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8672", "outputIndexes": [ 2112 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2112, 2111 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8673", "outputIndexes": [ 2113 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2096, 2113, 2099 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_349_output_0", "outputIndexes": [ 2114 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_737_output_0", "outputIndexes": [ 2115 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2107, 2115, 30, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_299_output_0", "outputIndexes": [ 2116 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2095, 2116 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_208_output_0", "outputIndexes": [ 2117 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_184_output_0", "outputIndexes": [ 2118 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117 ] , "main_type": "NONE", "name": "/Shape_324_output_0", "outputIndexes": [ 2119 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2119 ] , "main_type": "NONE", "name": "Shape8742", "outputIndexes": [ 2120 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2119 ] , "main_type": "NONE", "name": "Rank8744", "outputIndexes": [ 2121 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2121, 2121 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8746", "outputIndexes": [ 2122 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8747", "outputIndexes": [ 2123 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2122, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8749", "outputIndexes": [ 2124 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2124 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8750", "outputIndexes": [ 2125 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2120, 2123, 2125, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8753", "outputIndexes": [ 2126 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2126 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8754", "outputIndexes": [ 2127 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 2127 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8755", "outputIndexes": [ 2128 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2128, 2127 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8756", "outputIndexes": [ 2129 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2119, 2129, 2122 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_350_output_0", "outputIndexes": [ 2130 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2130, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_69_output_0", "outputIndexes": [ 2131 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2131, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_743_output_0", "outputIndexes": [ 2132 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 2132, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_93_output_0", "outputIndexes": [ 2133 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2133 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_46_output_0", "outputIndexes": [ 2134 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2131, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_742_output_0", "outputIndexes": [ 2135 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2117, 20, 2135, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_92_output_0", "outputIndexes": [ 2136 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2134, 2136 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_302_output_0", "outputIndexes": [ 2137 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2137, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_185_output_0", "outputIndexes": [ 2138 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2118, 2138 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_115_output_0", "outputIndexes": [ 2139 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 215274988, 57366, 14336, 512, 0 ] } , "name": "/layers.23/self_attn/k_proj/Linear", "outputIndexes": [ 2836 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2836 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_convert", "outputIndexes": [ 2837 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2837 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/k_proj/Linear/post_reshape", "outputIndexes": [ 2140 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_738_output_0", "outputIndexes": [ 2141 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_739_output_0", "outputIndexes": [ 2142 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2141, 2142, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_300_output_0", "outputIndexes": [ 2143 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2140, 2143 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_209_output_0", "outputIndexes": [ 2144 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144, 58 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_186_output_0", "outputIndexes": [ 2145 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144 ] , "main_type": "NONE", "name": "/Shape_325_output_0", "outputIndexes": [ 2146 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2146 ] , "main_type": "NONE", "name": "Shape8680", "outputIndexes": [ 2147 ] , "type": "Shape", "defaultDimentionFormat": "NCHW" } , { "inputIndexes": [ 2146 ] , "main_type": "NONE", "name": "Rank8682", "outputIndexes": [ 2148 ] , "type": "Rank", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2148, 2148 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8684", "outputIndexes": [ 2149 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8685", "outputIndexes": [ 2150 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2149, 12 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8687", "outputIndexes": [ 2151 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2151 ] , "main_type": "SqueezeParam", "main": { "squeezeDims": [ 0 ] } , "name": "Unsqueeze8688", "outputIndexes": [ 2152 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2147, 2150, 2152, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_FLOAT", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 0 } , "name": "StridedSlice8691", "outputIndexes": [ 2153 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2153 ] , "main_type": "SqueezeParam", "main": { } , "name": "Squeeze8692", "outputIndexes": [ 2154 ] , "type": "Squeeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 61, 2154 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8693", "outputIndexes": [ 2155 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2155, 2154 ] , "main_type": "BinaryOp", "main": { "opType": 19, "T": "DT_FLOAT", "activationType": 0 } , "name": "BinaryOp8694", "outputIndexes": [ 2156 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2146, 2156, 2149 ] , "main_type": "GatherV2", "main": { "Taxis": "DT_INVALID", "Tindices": "DT_INVALID", "Tparams": "DT_INVALID" } , "name": "/Gather_351_output_0", "outputIndexes": [ 2157 ] , "type": "GatherV2", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2157, 73 ] , "main_type": "BinaryOp", "main": { "opType": 7, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Div_70_output_0", "outputIndexes": [ 2158 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_745_output_0", "outputIndexes": [ 2159 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144, 2159, 76, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_95_output_0", "outputIndexes": [ 2160 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2160 ] , "main_type": "UnaryOp", "main": { "opType": "NEG", "T": "DT_FLOAT" } , "name": "/Neg_47_output_0", "outputIndexes": [ 2161 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2158, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_744_output_0", "outputIndexes": [ 2162 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2144, 20, 2162, 77, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/Slice_94_output_0", "outputIndexes": [ 2163 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2161, 2163 ] , "main_type": "Axis", "main": { "axis": -1 } , "name": "/Concat_303_output_0", "outputIndexes": [ 2164 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2164, 89 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Mul_187_output_0", "outputIndexes": [ 2165 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2145, 2165 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_116_output_0", "outputIndexes": [ 2166 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2831 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 128, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 1792, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 215347202, 57366, 14336, 512, 0 ] } , "name": "/layers.23/self_attn/v_proj/Linear", "outputIndexes": [ 2840 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2840 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_convert", "outputIndexes": [ 2841 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2841 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 128 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/v_proj/Linear/post_reshape", "outputIndexes": [ 2167 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2106, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_740_output_0", "outputIndexes": [ 2168 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2114, 20 ] , "main_type": "SqueezeParam", "main": { } , "name": "/Unsqueeze_741_output_0", "outputIndexes": [ 2169 ] , "type": "Unsqueeze", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2168, 2169, 46, 31 ] , "main_type": "Axis", "main": { "axis": 0 } , "name": "/Concat_301_output_0", "outputIndexes": [ 2170 ] , "type": "Concat", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2167, 2170 ] , "main_type": "Reshape", "main": { "dimType": "NCHW" } , "name": "/Reshape_210_output_0", "outputIndexes": [ 2171 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2139, 2166, 2171, 124 ] , "main_type": "AttentionParam", "main": { "kv_cache": true } , "name": "Attention/Reshape_215_output_0", "outputIndexes": [ 2172 ] , "type": "Attention", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2172 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_reshape", "outputIndexes": [ 2842 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2842 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/self_attn/o_proj/Linear/pre_convert", "outputIndexes": [ 2843 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2843 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 12544, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 215419416, 401430, 100352, 0, 0 ] } , "name": "/layers.23/self_attn/o_proj/Linear", "outputIndexes": [ 2844 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2844 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_convert", "outputIndexes": [ 2845 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2845 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.23/self_attn/o_proj/Linear/post_reshape", "outputIndexes": [ 2173 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2093, 2173 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_118_output_0", "outputIndexes": [ 2174 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2174 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 215921198, 3584, 3584 ] , "useRMSNorm": true } , "name": "/post_attention_layernorm_23/Mul_1_output_0", "outputIndexes": [ 2175 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2175 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_reshape", "outputIndexes": [ 2846 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2846 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/gate_proj/Linear/pre_convert", "outputIndexes": [ 2847 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2847 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 215928366, 2179094, 544768, 0, 0 ] } , "name": "/layers.23/mlp/gate_proj/Linear", "outputIndexes": [ 2848 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2848 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_convert", "outputIndexes": [ 2849 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2849 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/gate_proj/Linear/post_reshape", "outputIndexes": [ 2176 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2176 ] , "main_type": "UnaryOp", "main": { "opType": "SILU", "T": "DT_INVALID" } , "name": "/mlp/act_fn_23/Mul_output_0", "outputIndexes": [ 2177 ] , "type": "UnaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2847 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 4864, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 218652228, 2179094, 544768, 0, 0 ] } , "name": "/layers.23/mlp/up_proj/Linear", "outputIndexes": [ 2852 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2852 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_convert", "outputIndexes": [ 2853 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2853 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 4864 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/up_proj/Linear/post_reshape", "outputIndexes": [ 2178 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2177, 2178 ] , "main_type": "BinaryOp", "main": { "opType": 2, "T": "DT_FLOAT", "activationType": 0 } , "name": "/mlp_23/Mul_output_0", "outputIndexes": [ 2179 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2179 ] , "main_type": "Reshape", "main": { "dims": [ -1, 4864, 1, 1 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/pre_reshape", "outputIndexes": [ 2854 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2854 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/layers.23/mlp/down_proj/Linear/pre_convert", "outputIndexes": [ 2855 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2855 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 896, "inputCount": 4864, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 4, "aMin": 1, "readType": 68096, "has_scaleInt": false, "shapeInt32": false, "weightSize": 0 } , "external": [ 221376090, 2179094, 544768, 0, 0 ] } , "name": "/layers.23/mlp/down_proj/Linear", "outputIndexes": [ 2856 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2856 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_convert", "outputIndexes": [ 2857 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2857 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 896 ] , "dimType": "NCHW" } , "name": "/layers.23/mlp/down_proj/Linear/post_reshape", "outputIndexes": [ 2180 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2174, 2180 ] , "main_type": "BinaryOp", "main": { "opType": 0, "T": "DT_FLOAT", "activationType": 0 } , "name": "/Add_119_output_0", "outputIndexes": [ 2181 ] , "type": "BinaryOp", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2181, 2182, 76, 15, 15 ] , "main_type": "StridedSliceParam", "main": { "Index": "DT_INVALID", "T": "DT_INVALID", "beginMask": 0, "endMask": 0, "ellipsisMask": 0, "newAxisMask": 0, "shrinkAxisMask": 0, "fromType": 1 } , "name": "/lm/Slice_output_0", "outputIndexes": [ 2183 ] , "type": "StridedSlice", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2183 ] , "main_type": "LayerNorm", "main": { "axis": [ -1 ] , "epsilon": 0.000001, "group": 1, "external": [ 224099952, 3584, 3584 ] , "useRMSNorm": true } , "name": "/lm/norm/Mul_1_output_0", "outputIndexes": [ 2184 ] , "type": "LayerNorm", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2184 ] , "main_type": "Reshape", "main": { "dims": [ -1, 896, 1, 1 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/pre_reshape", "outputIndexes": [ 2858 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2858 ] , "main_type": "TensorConvertInfo", "main": { "source": "NCHW", "dest": "NC4HW4" } , "name": "/lm/lm_head/Linear/pre_convert", "outputIndexes": [ 2859 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2859 ] , "main_type": "Convolution2D", "main": { "common": { "padX": 0, "padY": 0, "kernelX": 1, "kernelY": 1, "strideX": 1, "strideY": 1, "dilateX": 1, "dilateY": 1, "padMode": "CAFFE", "group": 1, "outputCount": 151936, "inputCount": 896, "relu": false, "relu6": false, "hasOutputShape": false } , "quanParameter": { "type": 1, "useInt32": false, "quantScale": 1.0, "scaleIn": 0.0, "scaleOut": 0.0, "aMaxOrBits": 8, "aMin": 1, "readType": 2127104, "has_scaleInt": false, "shapeInt32": true, "weightSize": 0 } , "external": [ 224107120, 136134922, 17016832, 0, 0 ] } , "name": "/lm/lm_head/Linear", "outputIndexes": [ 2860 ] , "type": "Convolution", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2860 ] , "main_type": "TensorConvertInfo", "main": { "source": "NC4HW4", "dest": "NCHW" } , "name": "/lm/lm_head/Linear/post_convert", "outputIndexes": [ 2861 ] , "type": "ConvertTensor", "defaultDimentionFormat": "NHWC" } , { "inputIndexes": [ 2861 ] , "main_type": "Reshape", "main": { "dims": [ 1, -1, 151936 ] , "dimType": "NCHW" } , "name": "/lm/lm_head/Linear/post_reshape", "outputIndexes": [ 2185 ] , "type": "Reshape", "defaultDimentionFormat": "NHWC" } ] , "outputName": [ "logits", "presents" ] , "preferForwardType": "CPU", "sourceType": "ONNX", "tensorName": [ "past_key_values", "presents", "input_ids", "/Constant_output_0", "/Reshape_output_0", "/input_layernorm/Mul_1_output_0", "/FakeLinear_output_0", "/Shape_output_0", "Shape51", "BinaryOp54", "BinaryOp55", "Unsqueeze56", "Const9", "BinaryOp58", "Unsqueeze59", "Unsqueeze61", "StridedSlice62", "BinaryOp64", "BinaryOp65", "/Gather_1_output_0", "/rotary/Constant_4_output_0", "/Unsqueeze_output_0", "Unsqueeze75", "Unsqueeze78", "StridedSlice81", "Squeeze82", "BinaryOp83", "BinaryOp84", "/Gather_2_output_0", "/Unsqueeze_1_output_0", "/Constant_4_output_0", "/Constant_5_output_0", "/Concat_output_0", "/Reshape_1_output_0", "position_ids", "/rotary/Cast_output_0", "/rotary/Constant_1_output_0", "/rotary/Reshape_output_0", "/rotary/Constant_2_output_0", "/rotary/Mul_output_0", "/rotary/Cos_output_0", "/rotary/Unsqueeze_output_0", "/rotary/Sin_output_0", "/rotary/Unsqueeze_1_output_0", "/rotary/Concat_output_0", "/rotary/Concat_1_output_0", "/rotary/Constant_7_output_0", "/rotary/Unsqueeze_2_output_0", "/rotary/Unsqueeze_3_output_0", "Shape106", "BinaryOp109", "BinaryOp110", "Unsqueeze111", "BinaryOp113", "Unsqueeze114", "StridedSlice117", "BinaryOp119", "BinaryOp120", "/Gather_3_output_0", "/Mul_output_0", "/Shape_2_output_0", "/Constant_10_output_0", "Shape238", "BinaryOp241", "BinaryOp242", "Unsqueeze243", "BinaryOp245", "Unsqueeze246", "StridedSlice249", "Squeeze250", "BinaryOp251", "BinaryOp252", "/Gather_5_output_0", "/rotary/Constant_6_output_0", "/Div_output_0", "/Unsqueeze_7_output_0", "/Constant_19_output_0", "/Constant_13_output_0", "/Slice_1_output_0", "/Neg_output_0", "/Unsqueeze_6_output_0", "/Slice_output_0", "/Concat_3_output_0", "Unsqueeze157", "Unsqueeze160", "StridedSlice163", "Squeeze164", "BinaryOp165", "BinaryOp166", "/Gather_4_output_0", "/Mul_1_output_0", "/Add_output_0", "/FakeLinear_1_output_0", "/Unsqueeze_2_output_0", "/Unsqueeze_3_output_0", "/Concat_1_output_0", "/Reshape_2_output_0", "/Mul_2_output_0", "/Shape_3_output_0", "Shape125", "BinaryOp128", "BinaryOp129", "Unsqueeze130", "BinaryOp132", "Unsqueeze133", "StridedSlice136", "Squeeze137", "BinaryOp138", "BinaryOp139", "/Gather_6_output_0", "/Div_1_output_0", "/Unsqueeze_9_output_0", "/Slice_3_output_0", "/Neg_1_output_0", "/Unsqueeze_8_output_0", "/Slice_2_output_0", "/Concat_4_output_0", "/Mul_3_output_0", "/Add_1_output_0", "/FakeLinear_2_output_0", "/Unsqueeze_4_output_0", "/Unsqueeze_5_output_0", "/Concat_2_output_0", "/Reshape_3_output_0", "attention_mask", "/Reshape_8_output_0", "/FakeLinear_3_output_0", "/Add_3_output_0", "/post_attention_layernorm/Mul_1_output_0", "/mlp/gate_proj/FakeLinear_output_0", "/mlp/act_fn/Mul_output_0", "/mlp/up_proj/FakeLinear_output_0", "/mlp/Mul_output_0", "/mlp/down_proj/FakeLinear_output_0", "/Add_4_output_0", "/Reshape_9_output_0", "/input_layernorm_1/Mul_1_output_0", "/FakeLinear_4_output_0", "/Shape_14_output_0", "Shape483", "BinaryOp486", "BinaryOp487", "Unsqueeze488", "BinaryOp490", "Unsqueeze491", "StridedSlice494", "BinaryOp496", "BinaryOp497", "/Gather_18_output_0", "/Unsqueeze_32_output_0", "Unsqueeze505", "Unsqueeze508", "StridedSlice511", "Squeeze512", "BinaryOp513", "BinaryOp514", "/Gather_19_output_0", "/Unsqueeze_33_output_0", "/Concat_13_output_0", "/Reshape_10_output_0", "/Mul_8_output_0", "/Shape_16_output_0", "Shape614", "BinaryOp617", "BinaryOp618", "Unsqueeze619", "BinaryOp621", "Unsqueeze622", "StridedSlice625", "Squeeze626", "BinaryOp627", "BinaryOp628", "/Gather_20_output_0", "/Div_3_output_0", "/Unsqueeze_39_output_0", "/Slice_5_output_0", "/Neg_2_output_0", "/Unsqueeze_38_output_0", "/Slice_4_output_0", "/Concat_16_output_0", "/Mul_9_output_0", "/Add_5_output_0", "/FakeLinear_5_output_0", "/Unsqueeze_34_output_0", "/Unsqueeze_35_output_0", "/Concat_14_output_0", "/Reshape_11_output_0", "/Mul_10_output_0", "/Shape_17_output_0", "Shape521", "BinaryOp524", "BinaryOp525", "Unsqueeze526", "BinaryOp528", "Unsqueeze529", "StridedSlice532", "Squeeze533", "BinaryOp534", "BinaryOp535", "/Gather_21_output_0", "/Div_4_output_0", "/Unsqueeze_41_output_0", "/Slice_7_output_0", "/Neg_3_output_0", "/Unsqueeze_40_output_0", "/Slice_6_output_0", "/Concat_17_output_0", "/Mul_11_output_0", "/Add_6_output_0", "/FakeLinear_6_output_0", "/Unsqueeze_36_output_0", "/Unsqueeze_37_output_0", "/Concat_15_output_0", "/Reshape_12_output_0", "/Reshape_17_output_0", "/FakeLinear_7_output_0", "/Add_8_output_0", "/post_attention_layernorm_1/Mul_1_output_0", "/mlp/gate_proj_1/FakeLinear_output_0", "/mlp/act_fn_1/Mul_output_0", "/mlp/up_proj_1/FakeLinear_output_0", "/mlp_1/Mul_output_0", "/mlp/down_proj_1/FakeLinear_output_0", "/Add_9_output_0", "/Reshape_18_output_0", "/input_layernorm_2/Mul_1_output_0", "/FakeLinear_8_output_0", "/Shape_28_output_0", "Shape853", "BinaryOp856", "BinaryOp857", "Unsqueeze858", "BinaryOp860", "Unsqueeze861", "StridedSlice864", "BinaryOp866", "BinaryOp867", "/Gather_33_output_0", "/Unsqueeze_64_output_0", "Unsqueeze875", "Unsqueeze878", "StridedSlice881", "Squeeze882", "BinaryOp883", "BinaryOp884", "/Gather_34_output_0", "/Unsqueeze_65_output_0", "/Concat_26_output_0", "/Reshape_19_output_0", "/Mul_16_output_0", "/Shape_30_output_0", "Shape984", "BinaryOp987", "BinaryOp988", "Unsqueeze989", "BinaryOp991", "Unsqueeze992", "StridedSlice995", "Squeeze996", "BinaryOp997", "BinaryOp998", "/Gather_35_output_0", "/Div_6_output_0", "/Unsqueeze_71_output_0", "/Slice_9_output_0", "/Neg_4_output_0", "/Unsqueeze_70_output_0", "/Slice_8_output_0", "/Concat_29_output_0", "/Mul_17_output_0", "/Add_10_output_0", "/FakeLinear_9_output_0", "/Unsqueeze_66_output_0", "/Unsqueeze_67_output_0", "/Concat_27_output_0", "/Reshape_20_output_0", "/Mul_18_output_0", "/Shape_31_output_0", "Shape891", "BinaryOp894", "BinaryOp895", "Unsqueeze896", "BinaryOp898", "Unsqueeze899", "StridedSlice902", "Squeeze903", "BinaryOp904", "BinaryOp905", "/Gather_36_output_0", "/Div_7_output_0", "/Unsqueeze_73_output_0", "/Slice_11_output_0", "/Neg_5_output_0", "/Unsqueeze_72_output_0", "/Slice_10_output_0", "/Concat_30_output_0", "/Mul_19_output_0", "/Add_11_output_0", "/FakeLinear_10_output_0", "/Unsqueeze_68_output_0", "/Unsqueeze_69_output_0", "/Concat_28_output_0", "/Reshape_21_output_0", "/Reshape_26_output_0", "/FakeLinear_11_output_0", "/Add_13_output_0", "/post_attention_layernorm_2/Mul_1_output_0", "/mlp/gate_proj_2/FakeLinear_output_0", "/mlp/act_fn_2/Mul_output_0", "/mlp/up_proj_2/FakeLinear_output_0", "/mlp_2/Mul_output_0", "/mlp/down_proj_2/FakeLinear_output_0", "/Add_14_output_0", "/Reshape_27_output_0", "/input_layernorm_3/Mul_1_output_0", "/FakeLinear_12_output_0", "/Shape_42_output_0", "Shape1223", "BinaryOp1226", "BinaryOp1227", "Unsqueeze1228", "BinaryOp1230", "Unsqueeze1231", "StridedSlice1234", "BinaryOp1236", "BinaryOp1237", "/Gather_48_output_0", "/Unsqueeze_96_output_0", "Unsqueeze1245", "Unsqueeze1248", "StridedSlice1251", "Squeeze1252", "BinaryOp1253", "BinaryOp1254", "/Gather_49_output_0", "/Unsqueeze_97_output_0", "/Concat_39_output_0", "/Reshape_28_output_0", "/Mul_24_output_0", "/Shape_44_output_0", "Shape1355", "BinaryOp1358", "BinaryOp1359", "Unsqueeze1360", "BinaryOp1362", "Unsqueeze1363", "StridedSlice1366", "Squeeze1367", "BinaryOp1368", "BinaryOp1369", "/Gather_50_output_0", "/Div_9_output_0", "/Unsqueeze_103_output_0", "/Slice_13_output_0", "/Neg_6_output_0", "/Unsqueeze_102_output_0", "/Slice_12_output_0", "/Concat_42_output_0", "/Mul_25_output_0", "/Add_15_output_0", "/FakeLinear_13_output_0", "/Unsqueeze_98_output_0", "/Unsqueeze_99_output_0", "/Concat_40_output_0", "/Reshape_29_output_0", "/Mul_26_output_0", "/Shape_45_output_0", "Shape1261", "BinaryOp1264", "BinaryOp1265", "Unsqueeze1266", "BinaryOp1268", "Unsqueeze1269", "StridedSlice1272", "Squeeze1273", "BinaryOp1274", "BinaryOp1275", "/Gather_51_output_0", "/Div_10_output_0", "/Unsqueeze_105_output_0", "/Slice_15_output_0", "/Neg_7_output_0", "/Unsqueeze_104_output_0", "/Slice_14_output_0", "/Concat_43_output_0", "/Mul_27_output_0", "/Add_16_output_0", "/FakeLinear_14_output_0", "/Unsqueeze_100_output_0", "/Unsqueeze_101_output_0", "/Concat_41_output_0", "/Reshape_30_output_0", "/Reshape_35_output_0", "/FakeLinear_15_output_0", "/Add_18_output_0", "/post_attention_layernorm_3/Mul_1_output_0", "/mlp/gate_proj_3/FakeLinear_output_0", "/mlp/act_fn_3/Mul_output_0", "/mlp/up_proj_3/FakeLinear_output_0", "/mlp_3/Mul_output_0", "/mlp/down_proj_3/FakeLinear_output_0", "/Add_19_output_0", "/Reshape_36_output_0", "/input_layernorm_4/Mul_1_output_0", "/FakeLinear_16_output_0", "/Shape_56_output_0", "Shape1594", "BinaryOp1597", "BinaryOp1598", "Unsqueeze1599", "BinaryOp1601", "Unsqueeze1602", "StridedSlice1605", "BinaryOp1607", "BinaryOp1608", "/Gather_63_output_0", "/Unsqueeze_128_output_0", "Unsqueeze1616", "Unsqueeze1619", "StridedSlice1622", "Squeeze1623", "BinaryOp1624", "BinaryOp1625", "/Gather_64_output_0", "/Unsqueeze_129_output_0", "/Concat_52_output_0", "/Reshape_37_output_0", "/Mul_32_output_0", "/Shape_58_output_0", "Shape1726", "BinaryOp1729", "BinaryOp1730", "Unsqueeze1731", "BinaryOp1733", "Unsqueeze1734", "StridedSlice1737", "Squeeze1738", "BinaryOp1739", "BinaryOp1740", "/Gather_65_output_0", "/Div_12_output_0", "/Unsqueeze_135_output_0", "/Slice_17_output_0", "/Neg_8_output_0", "/Unsqueeze_134_output_0", "/Slice_16_output_0", "/Concat_55_output_0", "/Mul_33_output_0", "/Add_20_output_0", "/FakeLinear_17_output_0", "/Unsqueeze_130_output_0", "/Unsqueeze_131_output_0", "/Concat_53_output_0", "/Reshape_38_output_0", "/Mul_34_output_0", "/Shape_59_output_0", "Shape1632", "BinaryOp1635", "BinaryOp1636", "Unsqueeze1637", "BinaryOp1639", "Unsqueeze1640", "StridedSlice1643", "Squeeze1644", "BinaryOp1645", "BinaryOp1646", "/Gather_66_output_0", "/Div_13_output_0", "/Unsqueeze_137_output_0", "/Slice_19_output_0", "/Neg_9_output_0", "/Unsqueeze_136_output_0", "/Slice_18_output_0", "/Concat_56_output_0", "/Mul_35_output_0", "/Add_21_output_0", "/FakeLinear_18_output_0", "/Unsqueeze_132_output_0", "/Unsqueeze_133_output_0", "/Concat_54_output_0", "/Reshape_39_output_0", "/Reshape_44_output_0", "/FakeLinear_19_output_0", "/Add_23_output_0", "/post_attention_layernorm_4/Mul_1_output_0", "/mlp/gate_proj_4/FakeLinear_output_0", "/mlp/act_fn_4/Mul_output_0", "/mlp/up_proj_4/FakeLinear_output_0", "/mlp_4/Mul_output_0", "/mlp/down_proj_4/FakeLinear_output_0", "/Add_24_output_0", "/Reshape_45_output_0", "/input_layernorm_5/Mul_1_output_0", "/FakeLinear_20_output_0", "/Shape_70_output_0", "Shape1965", "BinaryOp1968", "BinaryOp1969", "Unsqueeze1970", "BinaryOp1972", "Unsqueeze1973", "StridedSlice1976", "BinaryOp1978", "BinaryOp1979", "/Gather_78_output_0", "/Unsqueeze_160_output_0", "Unsqueeze1987", "Unsqueeze1990", "StridedSlice1993", "Squeeze1994", "BinaryOp1995", "BinaryOp1996", "/Gather_79_output_0", "/Unsqueeze_161_output_0", "/Concat_65_output_0", "/Reshape_46_output_0", "/Mul_40_output_0", "/Shape_72_output_0", "Shape2097", "BinaryOp2100", "BinaryOp2101", "Unsqueeze2102", "BinaryOp2104", "Unsqueeze2105", "StridedSlice2108", "Squeeze2109", "BinaryOp2110", "BinaryOp2111", "/Gather_80_output_0", "/Div_15_output_0", "/Unsqueeze_167_output_0", "/Slice_21_output_0", "/Neg_10_output_0", "/Unsqueeze_166_output_0", "/Slice_20_output_0", "/Concat_68_output_0", "/Mul_41_output_0", "/Add_25_output_0", "/FakeLinear_21_output_0", "/Unsqueeze_162_output_0", "/Unsqueeze_163_output_0", "/Concat_66_output_0", "/Reshape_47_output_0", "/Mul_42_output_0", "/Shape_73_output_0", "Shape2003", "BinaryOp2006", "BinaryOp2007", "Unsqueeze2008", "BinaryOp2010", "Unsqueeze2011", "StridedSlice2014", "Squeeze2015", "BinaryOp2016", "BinaryOp2017", "/Gather_81_output_0", "/Div_16_output_0", "/Unsqueeze_169_output_0", "/Slice_23_output_0", "/Neg_11_output_0", "/Unsqueeze_168_output_0", "/Slice_22_output_0", "/Concat_69_output_0", "/Mul_43_output_0", "/Add_26_output_0", "/FakeLinear_22_output_0", "/Unsqueeze_164_output_0", "/Unsqueeze_165_output_0", "/Concat_67_output_0", "/Reshape_48_output_0", "/Reshape_53_output_0", "/FakeLinear_23_output_0", "/Add_28_output_0", "/post_attention_layernorm_5/Mul_1_output_0", "/mlp/gate_proj_5/FakeLinear_output_0", "/mlp/act_fn_5/Mul_output_0", "/mlp/up_proj_5/FakeLinear_output_0", "/mlp_5/Mul_output_0", "/mlp/down_proj_5/FakeLinear_output_0", "/Add_29_output_0", "/Reshape_54_output_0", "/input_layernorm_6/Mul_1_output_0", "/FakeLinear_24_output_0", "/Shape_84_output_0", "Shape2336", "BinaryOp2339", "BinaryOp2340", "Unsqueeze2341", "BinaryOp2343", "Unsqueeze2344", "StridedSlice2347", "BinaryOp2349", "BinaryOp2350", "/Gather_93_output_0", "/Unsqueeze_192_output_0", "Unsqueeze2358", "Unsqueeze2361", "StridedSlice2364", "Squeeze2365", "BinaryOp2366", "BinaryOp2367", "/Gather_94_output_0", "/Unsqueeze_193_output_0", "/Concat_78_output_0", "/Reshape_55_output_0", "/Mul_48_output_0", "/Shape_86_output_0", "Shape2467", "BinaryOp2470", "BinaryOp2471", "Unsqueeze2472", "BinaryOp2474", "Unsqueeze2475", "StridedSlice2478", "Squeeze2479", "BinaryOp2480", "BinaryOp2481", "/Gather_95_output_0", "/Div_18_output_0", "/Unsqueeze_199_output_0", "/Slice_25_output_0", "/Neg_12_output_0", "/Unsqueeze_198_output_0", "/Slice_24_output_0", "/Concat_81_output_0", "/Mul_49_output_0", "/Add_30_output_0", "/FakeLinear_25_output_0", "/Unsqueeze_194_output_0", "/Unsqueeze_195_output_0", "/Concat_79_output_0", "/Reshape_56_output_0", "/Mul_50_output_0", "/Shape_87_output_0", "Shape2374", "BinaryOp2377", "BinaryOp2378", "Unsqueeze2379", "BinaryOp2381", "Unsqueeze2382", "StridedSlice2385", "Squeeze2386", "BinaryOp2387", "BinaryOp2388", "/Gather_96_output_0", "/Div_19_output_0", "/Unsqueeze_201_output_0", "/Slice_27_output_0", "/Neg_13_output_0", "/Unsqueeze_200_output_0", "/Slice_26_output_0", "/Concat_82_output_0", "/Mul_51_output_0", "/Add_31_output_0", "/FakeLinear_26_output_0", "/Unsqueeze_196_output_0", "/Unsqueeze_197_output_0", "/Concat_80_output_0", "/Reshape_57_output_0", "/Reshape_62_output_0", "/FakeLinear_27_output_0", "/Add_33_output_0", "/post_attention_layernorm_6/Mul_1_output_0", "/mlp/gate_proj_6/FakeLinear_output_0", "/mlp/act_fn_6/Mul_output_0", "/mlp/up_proj_6/FakeLinear_output_0", "/mlp_6/Mul_output_0", "/mlp/down_proj_6/FakeLinear_output_0", "/Add_34_output_0", "/Reshape_63_output_0", "/input_layernorm_7/Mul_1_output_0", "/FakeLinear_28_output_0", "/Shape_98_output_0", "Shape2706", "BinaryOp2709", "BinaryOp2710", "Unsqueeze2711", "BinaryOp2713", "Unsqueeze2714", "StridedSlice2717", "BinaryOp2719", "BinaryOp2720", "/Gather_108_output_0", "/Unsqueeze_224_output_0", "Unsqueeze2728", "Unsqueeze2731", "StridedSlice2734", "Squeeze2735", "BinaryOp2736", "BinaryOp2737", "/Gather_109_output_0", "/Unsqueeze_225_output_0", "/Concat_91_output_0", "/Reshape_64_output_0", "/Mul_56_output_0", "/Shape_100_output_0", "Shape2838", "BinaryOp2841", "BinaryOp2842", "Unsqueeze2843", "BinaryOp2845", "Unsqueeze2846", "StridedSlice2849", "Squeeze2850", "BinaryOp2851", "BinaryOp2852", "/Gather_110_output_0", "/Div_21_output_0", "/Unsqueeze_231_output_0", "/Slice_29_output_0", "/Neg_14_output_0", "/Unsqueeze_230_output_0", "/Slice_28_output_0", "/Concat_94_output_0", "/Mul_57_output_0", "/Add_35_output_0", "/FakeLinear_29_output_0", "/Unsqueeze_226_output_0", "/Unsqueeze_227_output_0", "/Concat_92_output_0", "/Reshape_65_output_0", "/Mul_58_output_0", "/Shape_101_output_0", "Shape2744", "BinaryOp2747", "BinaryOp2748", "Unsqueeze2749", "BinaryOp2751", "Unsqueeze2752", "StridedSlice2755", "Squeeze2756", "BinaryOp2757", "BinaryOp2758", "/Gather_111_output_0", "/Div_22_output_0", "/Unsqueeze_233_output_0", "/Slice_31_output_0", "/Neg_15_output_0", "/Unsqueeze_232_output_0", "/Slice_30_output_0", "/Concat_95_output_0", "/Mul_59_output_0", "/Add_36_output_0", "/FakeLinear_30_output_0", "/Unsqueeze_228_output_0", "/Unsqueeze_229_output_0", "/Concat_93_output_0", "/Reshape_66_output_0", "/Reshape_71_output_0", "/FakeLinear_31_output_0", "/Add_38_output_0", "/post_attention_layernorm_7/Mul_1_output_0", "/mlp/gate_proj_7/FakeLinear_output_0", "/mlp/act_fn_7/Mul_output_0", "/mlp/up_proj_7/FakeLinear_output_0", "/mlp_7/Mul_output_0", "/mlp/down_proj_7/FakeLinear_output_0", "/Add_39_output_0", "/Reshape_72_output_0", "/input_layernorm_8/Mul_1_output_0", "/FakeLinear_32_output_0", "/Shape_112_output_0", "Shape3077", "BinaryOp3080", "BinaryOp3081", "Unsqueeze3082", "BinaryOp3084", "Unsqueeze3085", "StridedSlice3088", "BinaryOp3090", "BinaryOp3091", "/Gather_123_output_0", "/Unsqueeze_256_output_0", "Unsqueeze3099", "Unsqueeze3102", "StridedSlice3105", "Squeeze3106", "BinaryOp3107", "BinaryOp3108", "/Gather_124_output_0", "/Unsqueeze_257_output_0", "/Concat_104_output_0", "/Reshape_73_output_0", "/Mul_64_output_0", "/Shape_114_output_0", "Shape3209", "BinaryOp3212", "BinaryOp3213", "Unsqueeze3214", "BinaryOp3216", "Unsqueeze3217", "StridedSlice3220", "Squeeze3221", "BinaryOp3222", "BinaryOp3223", "/Gather_125_output_0", "/Div_24_output_0", "/Unsqueeze_263_output_0", "/Slice_33_output_0", "/Neg_16_output_0", "/Unsqueeze_262_output_0", "/Slice_32_output_0", "/Concat_107_output_0", "/Mul_65_output_0", "/Add_40_output_0", "/FakeLinear_33_output_0", "/Unsqueeze_258_output_0", "/Unsqueeze_259_output_0", "/Concat_105_output_0", "/Reshape_74_output_0", "/Mul_66_output_0", "/Shape_115_output_0", "Shape3115", "BinaryOp3118", "BinaryOp3119", "Unsqueeze3120", "BinaryOp3122", "Unsqueeze3123", "StridedSlice3126", "Squeeze3127", "BinaryOp3128", "BinaryOp3129", "/Gather_126_output_0", "/Div_25_output_0", "/Unsqueeze_265_output_0", "/Slice_35_output_0", "/Neg_17_output_0", "/Unsqueeze_264_output_0", "/Slice_34_output_0", "/Concat_108_output_0", "/Mul_67_output_0", "/Add_41_output_0", "/FakeLinear_34_output_0", "/Unsqueeze_260_output_0", "/Unsqueeze_261_output_0", "/Concat_106_output_0", "/Reshape_75_output_0", "/Reshape_80_output_0", "/FakeLinear_35_output_0", "/Add_43_output_0", "/post_attention_layernorm_8/Mul_1_output_0", "/mlp/gate_proj_8/FakeLinear_output_0", "/mlp/act_fn_8/Mul_output_0", "/mlp/up_proj_8/FakeLinear_output_0", "/mlp_8/Mul_output_0", "/mlp/down_proj_8/FakeLinear_output_0", "/Add_44_output_0", "/Reshape_81_output_0", "/input_layernorm_9/Mul_1_output_0", "/FakeLinear_36_output_0", "/Shape_126_output_0", "Shape3448", "BinaryOp3451", "BinaryOp3452", "Unsqueeze3453", "BinaryOp3455", "Unsqueeze3456", "StridedSlice3459", "BinaryOp3461", "BinaryOp3462", "/Gather_138_output_0", "/Unsqueeze_288_output_0", "Unsqueeze3470", "Unsqueeze3473", "StridedSlice3476", "Squeeze3477", "BinaryOp3478", "BinaryOp3479", "/Gather_139_output_0", "/Unsqueeze_289_output_0", "/Concat_117_output_0", "/Reshape_82_output_0", "/Mul_72_output_0", "/Shape_128_output_0", "Shape3580", "BinaryOp3583", "BinaryOp3584", "Unsqueeze3585", "BinaryOp3587", "Unsqueeze3588", "StridedSlice3591", "Squeeze3592", "BinaryOp3593", "BinaryOp3594", "/Gather_140_output_0", "/Div_27_output_0", "/Unsqueeze_295_output_0", "/Slice_37_output_0", "/Neg_18_output_0", "/Unsqueeze_294_output_0", "/Slice_36_output_0", "/Concat_120_output_0", "/Mul_73_output_0", "/Add_45_output_0", "/FakeLinear_37_output_0", "/Unsqueeze_290_output_0", "/Unsqueeze_291_output_0", "/Concat_118_output_0", "/Reshape_83_output_0", "/Mul_74_output_0", "/Shape_129_output_0", "Shape3486", "BinaryOp3489", "BinaryOp3490", "Unsqueeze3491", "BinaryOp3493", "Unsqueeze3494", "StridedSlice3497", "Squeeze3498", "BinaryOp3499", "BinaryOp3500", "/Gather_141_output_0", "/Div_28_output_0", "/Unsqueeze_297_output_0", "/Slice_39_output_0", "/Neg_19_output_0", "/Unsqueeze_296_output_0", "/Slice_38_output_0", "/Concat_121_output_0", "/Mul_75_output_0", "/Add_46_output_0", "/FakeLinear_38_output_0", "/Unsqueeze_292_output_0", "/Unsqueeze_293_output_0", "/Concat_119_output_0", "/Reshape_84_output_0", "/Reshape_89_output_0", "/FakeLinear_39_output_0", "/Add_48_output_0", "/post_attention_layernorm_9/Mul_1_output_0", "/mlp/gate_proj_9/FakeLinear_output_0", "/mlp/act_fn_9/Mul_output_0", "/mlp/up_proj_9/FakeLinear_output_0", "/mlp_9/Mul_output_0", "/mlp/down_proj_9/FakeLinear_output_0", "/Add_49_output_0", "/Reshape_90_output_0", "/input_layernorm_10/Mul_1_output_0", "/FakeLinear_40_output_0", "/Shape_140_output_0", "Shape3819", "BinaryOp3822", "BinaryOp3823", "Unsqueeze3824", "BinaryOp3826", "Unsqueeze3827", "StridedSlice3830", "BinaryOp3832", "BinaryOp3833", "/Gather_153_output_0", "/Unsqueeze_320_output_0", "Unsqueeze3841", "Unsqueeze3844", "StridedSlice3847", "Squeeze3848", "BinaryOp3849", "BinaryOp3850", "/Gather_154_output_0", "/Unsqueeze_321_output_0", "/Concat_130_output_0", "/Reshape_91_output_0", "/Mul_80_output_0", "/Shape_142_output_0", "Shape3951", "BinaryOp3954", "BinaryOp3955", "Unsqueeze3956", "BinaryOp3958", "Unsqueeze3959", "StridedSlice3962", "Squeeze3963", "BinaryOp3964", "BinaryOp3965", "/Gather_155_output_0", "/Div_30_output_0", "/Unsqueeze_327_output_0", "/Slice_41_output_0", "/Neg_20_output_0", "/Unsqueeze_326_output_0", "/Slice_40_output_0", "/Concat_133_output_0", "/Mul_81_output_0", "/Add_50_output_0", "/FakeLinear_41_output_0", "/Unsqueeze_322_output_0", "/Unsqueeze_323_output_0", "/Concat_131_output_0", "/Reshape_92_output_0", "/Mul_82_output_0", "/Shape_143_output_0", "Shape3857", "BinaryOp3860", "BinaryOp3861", "Unsqueeze3862", "BinaryOp3864", "Unsqueeze3865", "StridedSlice3868", "Squeeze3869", "BinaryOp3870", "BinaryOp3871", "/Gather_156_output_0", "/Div_31_output_0", "/Unsqueeze_329_output_0", "/Slice_43_output_0", "/Neg_21_output_0", "/Unsqueeze_328_output_0", "/Slice_42_output_0", "/Concat_134_output_0", "/Mul_83_output_0", "/Add_51_output_0", "/FakeLinear_42_output_0", "/Unsqueeze_324_output_0", "/Unsqueeze_325_output_0", "/Concat_132_output_0", "/Reshape_93_output_0", "/Reshape_98_output_0", "/FakeLinear_43_output_0", "/Add_53_output_0", "/post_attention_layernorm_10/Mul_1_output_0", "/mlp/gate_proj_10/FakeLinear_output_0", "/mlp/act_fn_10/Mul_output_0", "/mlp/up_proj_10/FakeLinear_output_0", "/mlp_10/Mul_output_0", "/mlp/down_proj_10/FakeLinear_output_0", "/Add_54_output_0", "/Reshape_99_output_0", "/input_layernorm_11/Mul_1_output_0", "/FakeLinear_44_output_0", "/Shape_154_output_0", "Shape4190", "BinaryOp4193", "BinaryOp4194", "Unsqueeze4195", "BinaryOp4197", "Unsqueeze4198", "StridedSlice4201", "BinaryOp4203", "BinaryOp4204", "/Gather_168_output_0", "/Unsqueeze_352_output_0", "Unsqueeze4212", "Unsqueeze4215", "StridedSlice4218", "Squeeze4219", "BinaryOp4220", "BinaryOp4221", "/Gather_169_output_0", "/Unsqueeze_353_output_0", "/Concat_143_output_0", "/Reshape_100_output_0", "/Mul_88_output_0", "/Shape_156_output_0", "Shape4322", "BinaryOp4325", "BinaryOp4326", "Unsqueeze4327", "BinaryOp4329", "Unsqueeze4330", "StridedSlice4333", "Squeeze4334", "BinaryOp4335", "BinaryOp4336", "/Gather_170_output_0", "/Div_33_output_0", "/Unsqueeze_359_output_0", "/Slice_45_output_0", "/Neg_22_output_0", "/Unsqueeze_358_output_0", "/Slice_44_output_0", "/Concat_146_output_0", "/Mul_89_output_0", "/Add_55_output_0", "/FakeLinear_45_output_0", "/Unsqueeze_354_output_0", "/Unsqueeze_355_output_0", "/Concat_144_output_0", "/Reshape_101_output_0", "/Mul_90_output_0", "/Shape_157_output_0", "Shape4228", "BinaryOp4231", "BinaryOp4232", "Unsqueeze4233", "BinaryOp4235", "Unsqueeze4236", "StridedSlice4239", "Squeeze4240", "BinaryOp4241", "BinaryOp4242", "/Gather_171_output_0", "/Div_34_output_0", "/Unsqueeze_361_output_0", "/Slice_47_output_0", "/Neg_23_output_0", "/Unsqueeze_360_output_0", "/Slice_46_output_0", "/Concat_147_output_0", "/Mul_91_output_0", "/Add_56_output_0", "/FakeLinear_46_output_0", "/Unsqueeze_356_output_0", "/Unsqueeze_357_output_0", "/Concat_145_output_0", "/Reshape_102_output_0", "/Reshape_107_output_0", "/FakeLinear_47_output_0", "/Add_58_output_0", "/post_attention_layernorm_11/Mul_1_output_0", "/mlp/gate_proj_11/FakeLinear_output_0", "/mlp/act_fn_11/Mul_output_0", "/mlp/up_proj_11/FakeLinear_output_0", "/mlp_11/Mul_output_0", "/mlp/down_proj_11/FakeLinear_output_0", "/Add_59_output_0", "/Reshape_108_output_0", "/input_layernorm_12/Mul_1_output_0", "/FakeLinear_48_output_0", "/Shape_168_output_0", "Shape4561", "BinaryOp4564", "BinaryOp4565", "Unsqueeze4566", "BinaryOp4568", "Unsqueeze4569", "StridedSlice4572", "BinaryOp4574", "BinaryOp4575", "/Gather_183_output_0", "/Unsqueeze_384_output_0", "Unsqueeze4583", "Unsqueeze4586", "StridedSlice4589", "Squeeze4590", "BinaryOp4591", "BinaryOp4592", "/Gather_184_output_0", "/Unsqueeze_385_output_0", "/Concat_156_output_0", "/Reshape_109_output_0", "/Mul_96_output_0", "/Shape_170_output_0", "Shape4693", "BinaryOp4696", "BinaryOp4697", "Unsqueeze4698", "BinaryOp4700", "Unsqueeze4701", "StridedSlice4704", "Squeeze4705", "BinaryOp4706", "BinaryOp4707", "/Gather_185_output_0", "/Div_36_output_0", "/Unsqueeze_391_output_0", "/Slice_49_output_0", "/Neg_24_output_0", "/Unsqueeze_390_output_0", "/Slice_48_output_0", "/Concat_159_output_0", "/Mul_97_output_0", "/Add_60_output_0", "/FakeLinear_49_output_0", "/Unsqueeze_386_output_0", "/Unsqueeze_387_output_0", "/Concat_157_output_0", "/Reshape_110_output_0", "/Mul_98_output_0", "/Shape_171_output_0", "Shape4599", "BinaryOp4602", "BinaryOp4603", "Unsqueeze4604", "BinaryOp4606", "Unsqueeze4607", "StridedSlice4610", "Squeeze4611", "BinaryOp4612", "BinaryOp4613", "/Gather_186_output_0", "/Div_37_output_0", "/Unsqueeze_393_output_0", "/Slice_51_output_0", "/Neg_25_output_0", "/Unsqueeze_392_output_0", "/Slice_50_output_0", "/Concat_160_output_0", "/Mul_99_output_0", "/Add_61_output_0", "/FakeLinear_50_output_0", "/Unsqueeze_388_output_0", "/Unsqueeze_389_output_0", "/Concat_158_output_0", "/Reshape_111_output_0", "/Reshape_116_output_0", "/FakeLinear_51_output_0", "/Add_63_output_0", "/post_attention_layernorm_12/Mul_1_output_0", "/mlp/gate_proj_12/FakeLinear_output_0", "/mlp/act_fn_12/Mul_output_0", "/mlp/up_proj_12/FakeLinear_output_0", "/mlp_12/Mul_output_0", "/mlp/down_proj_12/FakeLinear_output_0", "/Add_64_output_0", "/Reshape_117_output_0", "/input_layernorm_13/Mul_1_output_0", "/FakeLinear_52_output_0", "/Shape_182_output_0", "Shape4932", "BinaryOp4935", "BinaryOp4936", "Unsqueeze4937", "BinaryOp4939", "Unsqueeze4940", "StridedSlice4943", "BinaryOp4945", "BinaryOp4946", "/Gather_198_output_0", "/Unsqueeze_416_output_0", "Unsqueeze4954", "Unsqueeze4957", "StridedSlice4960", "Squeeze4961", "BinaryOp4962", "BinaryOp4963", "/Gather_199_output_0", "/Unsqueeze_417_output_0", "/Concat_169_output_0", "/Reshape_118_output_0", "/Mul_104_output_0", "/Shape_184_output_0", "Shape5064", "BinaryOp5067", "BinaryOp5068", "Unsqueeze5069", "BinaryOp5071", "Unsqueeze5072", "StridedSlice5075", "Squeeze5076", "BinaryOp5077", "BinaryOp5078", "/Gather_200_output_0", "/Div_39_output_0", "/Unsqueeze_423_output_0", "/Slice_53_output_0", "/Neg_26_output_0", "/Unsqueeze_422_output_0", "/Slice_52_output_0", "/Concat_172_output_0", "/Mul_105_output_0", "/Add_65_output_0", "/FakeLinear_53_output_0", "/Unsqueeze_418_output_0", "/Unsqueeze_419_output_0", "/Concat_170_output_0", "/Reshape_119_output_0", "/Mul_106_output_0", "/Shape_185_output_0", "Shape4970", "BinaryOp4973", "BinaryOp4974", "Unsqueeze4975", "BinaryOp4977", "Unsqueeze4978", "StridedSlice4981", "Squeeze4982", "BinaryOp4983", "BinaryOp4984", "/Gather_201_output_0", "/Div_40_output_0", "/Unsqueeze_425_output_0", "/Slice_55_output_0", "/Neg_27_output_0", "/Unsqueeze_424_output_0", "/Slice_54_output_0", "/Concat_173_output_0", "/Mul_107_output_0", "/Add_66_output_0", "/FakeLinear_54_output_0", "/Unsqueeze_420_output_0", "/Unsqueeze_421_output_0", "/Concat_171_output_0", "/Reshape_120_output_0", "/Reshape_125_output_0", "/FakeLinear_55_output_0", "/Add_68_output_0", "/post_attention_layernorm_13/Mul_1_output_0", "/mlp/gate_proj_13/FakeLinear_output_0", "/mlp/act_fn_13/Mul_output_0", "/mlp/up_proj_13/FakeLinear_output_0", "/mlp_13/Mul_output_0", "/mlp/down_proj_13/FakeLinear_output_0", "/Add_69_output_0", "/Reshape_126_output_0", "/input_layernorm_14/Mul_1_output_0", "/FakeLinear_56_output_0", "/Shape_196_output_0", "Shape5303", "BinaryOp5306", "BinaryOp5307", "Unsqueeze5308", "BinaryOp5310", "Unsqueeze5311", "StridedSlice5314", "BinaryOp5316", "BinaryOp5317", "/Gather_213_output_0", "/Unsqueeze_448_output_0", "Unsqueeze5325", "Unsqueeze5328", "StridedSlice5331", "Squeeze5332", "BinaryOp5333", "BinaryOp5334", "/Gather_214_output_0", "/Unsqueeze_449_output_0", "/Concat_182_output_0", "/Reshape_127_output_0", "/Mul_112_output_0", "/Shape_198_output_0", "Shape5435", "BinaryOp5438", "BinaryOp5439", "Unsqueeze5440", "BinaryOp5442", "Unsqueeze5443", "StridedSlice5446", "Squeeze5447", "BinaryOp5448", "BinaryOp5449", "/Gather_215_output_0", "/Div_42_output_0", "/Unsqueeze_455_output_0", "/Slice_57_output_0", "/Neg_28_output_0", "/Unsqueeze_454_output_0", "/Slice_56_output_0", "/Concat_185_output_0", "/Mul_113_output_0", "/Add_70_output_0", "/FakeLinear_57_output_0", "/Unsqueeze_450_output_0", "/Unsqueeze_451_output_0", "/Concat_183_output_0", "/Reshape_128_output_0", "/Mul_114_output_0", "/Shape_199_output_0", "Shape5341", "BinaryOp5344", "BinaryOp5345", "Unsqueeze5346", "BinaryOp5348", "Unsqueeze5349", "StridedSlice5352", "Squeeze5353", "BinaryOp5354", "BinaryOp5355", "/Gather_216_output_0", "/Div_43_output_0", "/Unsqueeze_457_output_0", "/Slice_59_output_0", "/Neg_29_output_0", "/Unsqueeze_456_output_0", "/Slice_58_output_0", "/Concat_186_output_0", "/Mul_115_output_0", "/Add_71_output_0", "/FakeLinear_58_output_0", "/Unsqueeze_452_output_0", "/Unsqueeze_453_output_0", "/Concat_184_output_0", "/Reshape_129_output_0", "/Reshape_134_output_0", "/FakeLinear_59_output_0", "/Add_73_output_0", "/post_attention_layernorm_14/Mul_1_output_0", "/mlp/gate_proj_14/FakeLinear_output_0", "/mlp/act_fn_14/Mul_output_0", "/mlp/up_proj_14/FakeLinear_output_0", "/mlp_14/Mul_output_0", "/mlp/down_proj_14/FakeLinear_output_0", "/Add_74_output_0", "/Reshape_135_output_0", "/input_layernorm_15/Mul_1_output_0", "/FakeLinear_60_output_0", "/Shape_210_output_0", "Shape5674", "BinaryOp5677", "BinaryOp5678", "Unsqueeze5679", "BinaryOp5681", "Unsqueeze5682", "StridedSlice5685", "BinaryOp5687", "BinaryOp5688", "/Gather_228_output_0", "/Unsqueeze_480_output_0", "Unsqueeze5696", "Unsqueeze5699", "StridedSlice5702", "Squeeze5703", "BinaryOp5704", "BinaryOp5705", "/Gather_229_output_0", "/Unsqueeze_481_output_0", "/Concat_195_output_0", "/Reshape_136_output_0", "/Mul_120_output_0", "/Shape_212_output_0", "Shape5806", "BinaryOp5809", "BinaryOp5810", "Unsqueeze5811", "BinaryOp5813", "Unsqueeze5814", "StridedSlice5817", "Squeeze5818", "BinaryOp5819", "BinaryOp5820", "/Gather_230_output_0", "/Div_45_output_0", "/Unsqueeze_487_output_0", "/Slice_61_output_0", "/Neg_30_output_0", "/Unsqueeze_486_output_0", "/Slice_60_output_0", "/Concat_198_output_0", "/Mul_121_output_0", "/Add_75_output_0", "/FakeLinear_61_output_0", "/Unsqueeze_482_output_0", "/Unsqueeze_483_output_0", "/Concat_196_output_0", "/Reshape_137_output_0", "/Mul_122_output_0", "/Shape_213_output_0", "Shape5712", "BinaryOp5715", "BinaryOp5716", "Unsqueeze5717", "BinaryOp5719", "Unsqueeze5720", "StridedSlice5723", "Squeeze5724", "BinaryOp5725", "BinaryOp5726", "/Gather_231_output_0", "/Div_46_output_0", "/Unsqueeze_489_output_0", "/Slice_63_output_0", "/Neg_31_output_0", "/Unsqueeze_488_output_0", "/Slice_62_output_0", "/Concat_199_output_0", "/Mul_123_output_0", "/Add_76_output_0", "/FakeLinear_62_output_0", "/Unsqueeze_484_output_0", "/Unsqueeze_485_output_0", "/Concat_197_output_0", "/Reshape_138_output_0", "/Reshape_143_output_0", "/FakeLinear_63_output_0", "/Add_78_output_0", "/post_attention_layernorm_15/Mul_1_output_0", "/mlp/gate_proj_15/FakeLinear_output_0", "/mlp/act_fn_15/Mul_output_0", "/mlp/up_proj_15/FakeLinear_output_0", "/mlp_15/Mul_output_0", "/mlp/down_proj_15/FakeLinear_output_0", "/Add_79_output_0", "/Reshape_144_output_0", "/input_layernorm_16/Mul_1_output_0", "/FakeLinear_64_output_0", "/Shape_224_output_0", "Shape6045", "BinaryOp6048", "BinaryOp6049", "Unsqueeze6050", "BinaryOp6052", "Unsqueeze6053", "StridedSlice6056", "BinaryOp6058", "BinaryOp6059", "/Gather_243_output_0", "/Unsqueeze_512_output_0", "Unsqueeze6067", "Unsqueeze6070", "StridedSlice6073", "Squeeze6074", "BinaryOp6075", "BinaryOp6076", "/Gather_244_output_0", "/Unsqueeze_513_output_0", "/Concat_208_output_0", "/Reshape_145_output_0", "/Mul_128_output_0", "/Shape_226_output_0", "Shape6177", "BinaryOp6180", "BinaryOp6181", "Unsqueeze6182", "BinaryOp6184", "Unsqueeze6185", "StridedSlice6188", "Squeeze6189", "BinaryOp6190", "BinaryOp6191", "/Gather_245_output_0", "/Div_48_output_0", "/Unsqueeze_519_output_0", "/Slice_65_output_0", "/Neg_32_output_0", "/Unsqueeze_518_output_0", "/Slice_64_output_0", "/Concat_211_output_0", "/Mul_129_output_0", "/Add_80_output_0", "/FakeLinear_65_output_0", "/Unsqueeze_514_output_0", "/Unsqueeze_515_output_0", "/Concat_209_output_0", "/Reshape_146_output_0", "/Mul_130_output_0", "/Shape_227_output_0", "Shape6083", "BinaryOp6086", "BinaryOp6087", "Unsqueeze6088", "BinaryOp6090", "Unsqueeze6091", "StridedSlice6094", "Squeeze6095", "BinaryOp6096", "BinaryOp6097", "/Gather_246_output_0", "/Div_49_output_0", "/Unsqueeze_521_output_0", "/Slice_67_output_0", "/Neg_33_output_0", "/Unsqueeze_520_output_0", "/Slice_66_output_0", "/Concat_212_output_0", "/Mul_131_output_0", "/Add_81_output_0", "/FakeLinear_66_output_0", "/Unsqueeze_516_output_0", "/Unsqueeze_517_output_0", "/Concat_210_output_0", "/Reshape_147_output_0", "/Reshape_152_output_0", "/FakeLinear_67_output_0", "/Add_83_output_0", "/post_attention_layernorm_16/Mul_1_output_0", "/mlp/gate_proj_16/FakeLinear_output_0", "/mlp/act_fn_16/Mul_output_0", "/mlp/up_proj_16/FakeLinear_output_0", "/mlp_16/Mul_output_0", "/mlp/down_proj_16/FakeLinear_output_0", "/Add_84_output_0", "/Reshape_153_output_0", "/input_layernorm_17/Mul_1_output_0", "/FakeLinear_68_output_0", "/Shape_238_output_0", "Shape6416", "BinaryOp6419", "BinaryOp6420", "Unsqueeze6421", "BinaryOp6423", "Unsqueeze6424", "StridedSlice6427", "BinaryOp6429", "BinaryOp6430", "/Gather_258_output_0", "/Unsqueeze_544_output_0", "Unsqueeze6438", "Unsqueeze6441", "StridedSlice6444", "Squeeze6445", "BinaryOp6446", "BinaryOp6447", "/Gather_259_output_0", "/Unsqueeze_545_output_0", "/Concat_221_output_0", "/Reshape_154_output_0", "/Mul_136_output_0", "/Shape_240_output_0", "Shape6548", "BinaryOp6551", "BinaryOp6552", "Unsqueeze6553", "BinaryOp6555", "Unsqueeze6556", "StridedSlice6559", "Squeeze6560", "BinaryOp6561", "BinaryOp6562", "/Gather_260_output_0", "/Div_51_output_0", "/Unsqueeze_551_output_0", "/Slice_69_output_0", "/Neg_34_output_0", "/Unsqueeze_550_output_0", "/Slice_68_output_0", "/Concat_224_output_0", "/Mul_137_output_0", "/Add_85_output_0", "/FakeLinear_69_output_0", "/Unsqueeze_546_output_0", "/Unsqueeze_547_output_0", "/Concat_222_output_0", "/Reshape_155_output_0", "/Mul_138_output_0", "/Shape_241_output_0", "Shape6454", "BinaryOp6457", "BinaryOp6458", "Unsqueeze6459", "BinaryOp6461", "Unsqueeze6462", "StridedSlice6465", "Squeeze6466", "BinaryOp6467", "BinaryOp6468", "/Gather_261_output_0", "/Div_52_output_0", "/Unsqueeze_553_output_0", "/Slice_71_output_0", "/Neg_35_output_0", "/Unsqueeze_552_output_0", "/Slice_70_output_0", "/Concat_225_output_0", "/Mul_139_output_0", "/Add_86_output_0", "/FakeLinear_70_output_0", "/Unsqueeze_548_output_0", "/Unsqueeze_549_output_0", "/Concat_223_output_0", "/Reshape_156_output_0", "/Reshape_161_output_0", "/FakeLinear_71_output_0", "/Add_88_output_0", "/post_attention_layernorm_17/Mul_1_output_0", "/mlp/gate_proj_17/FakeLinear_output_0", "/mlp/act_fn_17/Mul_output_0", "/mlp/up_proj_17/FakeLinear_output_0", "/mlp_17/Mul_output_0", "/mlp/down_proj_17/FakeLinear_output_0", "/Add_89_output_0", "/Reshape_162_output_0", "/input_layernorm_18/Mul_1_output_0", "/FakeLinear_72_output_0", "/Shape_252_output_0", "Shape6787", "BinaryOp6790", "BinaryOp6791", "Unsqueeze6792", "BinaryOp6794", "Unsqueeze6795", "StridedSlice6798", "BinaryOp6800", "BinaryOp6801", "/Gather_273_output_0", "/Unsqueeze_576_output_0", "Unsqueeze6809", "Unsqueeze6812", "StridedSlice6815", "Squeeze6816", "BinaryOp6817", "BinaryOp6818", "/Gather_274_output_0", "/Unsqueeze_577_output_0", "/Concat_234_output_0", "/Reshape_163_output_0", "/Mul_144_output_0", "/Shape_254_output_0", "Shape6919", "BinaryOp6922", "BinaryOp6923", "Unsqueeze6924", "BinaryOp6926", "Unsqueeze6927", "StridedSlice6930", "Squeeze6931", "BinaryOp6932", "BinaryOp6933", "/Gather_275_output_0", "/Div_54_output_0", "/Unsqueeze_583_output_0", "/Slice_73_output_0", "/Neg_36_output_0", "/Unsqueeze_582_output_0", "/Slice_72_output_0", "/Concat_237_output_0", "/Mul_145_output_0", "/Add_90_output_0", "/FakeLinear_73_output_0", "/Unsqueeze_578_output_0", "/Unsqueeze_579_output_0", "/Concat_235_output_0", "/Reshape_164_output_0", "/Mul_146_output_0", "/Shape_255_output_0", "Shape6825", "BinaryOp6828", "BinaryOp6829", "Unsqueeze6830", "BinaryOp6832", "Unsqueeze6833", "StridedSlice6836", "Squeeze6837", "BinaryOp6838", "BinaryOp6839", "/Gather_276_output_0", "/Div_55_output_0", "/Unsqueeze_585_output_0", "/Slice_75_output_0", "/Neg_37_output_0", "/Unsqueeze_584_output_0", "/Slice_74_output_0", "/Concat_238_output_0", "/Mul_147_output_0", "/Add_91_output_0", "/FakeLinear_74_output_0", "/Unsqueeze_580_output_0", "/Unsqueeze_581_output_0", "/Concat_236_output_0", "/Reshape_165_output_0", "/Reshape_170_output_0", "/FakeLinear_75_output_0", "/Add_93_output_0", "/post_attention_layernorm_18/Mul_1_output_0", "/mlp/gate_proj_18/FakeLinear_output_0", "/mlp/act_fn_18/Mul_output_0", "/mlp/up_proj_18/FakeLinear_output_0", "/mlp_18/Mul_output_0", "/mlp/down_proj_18/FakeLinear_output_0", "/Add_94_output_0", "/Reshape_171_output_0", "/input_layernorm_19/Mul_1_output_0", "/FakeLinear_76_output_0", "/Shape_266_output_0", "Shape7158", "BinaryOp7161", "BinaryOp7162", "Unsqueeze7163", "BinaryOp7165", "Unsqueeze7166", "StridedSlice7169", "BinaryOp7171", "BinaryOp7172", "/Gather_288_output_0", "/Unsqueeze_608_output_0", "Unsqueeze7180", "Unsqueeze7183", "StridedSlice7186", "Squeeze7187", "BinaryOp7188", "BinaryOp7189", "/Gather_289_output_0", "/Unsqueeze_609_output_0", "/Concat_247_output_0", "/Reshape_172_output_0", "/Mul_152_output_0", "/Shape_268_output_0", "Shape7290", "BinaryOp7293", "BinaryOp7294", "Unsqueeze7295", "BinaryOp7297", "Unsqueeze7298", "StridedSlice7301", "Squeeze7302", "BinaryOp7303", "BinaryOp7304", "/Gather_290_output_0", "/Div_57_output_0", "/Unsqueeze_615_output_0", "/Slice_77_output_0", "/Neg_38_output_0", "/Unsqueeze_614_output_0", "/Slice_76_output_0", "/Concat_250_output_0", "/Mul_153_output_0", "/Add_95_output_0", "/FakeLinear_77_output_0", "/Unsqueeze_610_output_0", "/Unsqueeze_611_output_0", "/Concat_248_output_0", "/Reshape_173_output_0", "/Mul_154_output_0", "/Shape_269_output_0", "Shape7196", "BinaryOp7199", "BinaryOp7200", "Unsqueeze7201", "BinaryOp7203", "Unsqueeze7204", "StridedSlice7207", "Squeeze7208", "BinaryOp7209", "BinaryOp7210", "/Gather_291_output_0", "/Div_58_output_0", "/Unsqueeze_617_output_0", "/Slice_79_output_0", "/Neg_39_output_0", "/Unsqueeze_616_output_0", "/Slice_78_output_0", "/Concat_251_output_0", "/Mul_155_output_0", "/Add_96_output_0", "/FakeLinear_78_output_0", "/Unsqueeze_612_output_0", "/Unsqueeze_613_output_0", "/Concat_249_output_0", "/Reshape_174_output_0", "/Reshape_179_output_0", "/FakeLinear_79_output_0", "/Add_98_output_0", "/post_attention_layernorm_19/Mul_1_output_0", "/mlp/gate_proj_19/FakeLinear_output_0", "/mlp/act_fn_19/Mul_output_0", "/mlp/up_proj_19/FakeLinear_output_0", "/mlp_19/Mul_output_0", "/mlp/down_proj_19/FakeLinear_output_0", "/Add_99_output_0", "/Reshape_180_output_0", "/input_layernorm_20/Mul_1_output_0", "/FakeLinear_80_output_0", "/Shape_280_output_0", "Shape7529", "BinaryOp7532", "BinaryOp7533", "Unsqueeze7534", "BinaryOp7536", "Unsqueeze7537", "StridedSlice7540", "BinaryOp7542", "BinaryOp7543", "/Gather_303_output_0", "/Unsqueeze_640_output_0", "Unsqueeze7551", "Unsqueeze7554", "StridedSlice7557", "Squeeze7558", "BinaryOp7559", "BinaryOp7560", "/Gather_304_output_0", "/Unsqueeze_641_output_0", "/Concat_260_output_0", "/Reshape_181_output_0", "/Mul_160_output_0", "/Shape_282_output_0", "Shape7661", "BinaryOp7664", "BinaryOp7665", "Unsqueeze7666", "BinaryOp7668", "Unsqueeze7669", "StridedSlice7672", "Squeeze7673", "BinaryOp7674", "BinaryOp7675", "/Gather_305_output_0", "/Div_60_output_0", "/Unsqueeze_647_output_0", "/Slice_81_output_0", "/Neg_40_output_0", "/Unsqueeze_646_output_0", "/Slice_80_output_0", "/Concat_263_output_0", "/Mul_161_output_0", "/Add_100_output_0", "/FakeLinear_81_output_0", "/Unsqueeze_642_output_0", "/Unsqueeze_643_output_0", "/Concat_261_output_0", "/Reshape_182_output_0", "/Mul_162_output_0", "/Shape_283_output_0", "Shape7567", "BinaryOp7570", "BinaryOp7571", "Unsqueeze7572", "BinaryOp7574", "Unsqueeze7575", "StridedSlice7578", "Squeeze7579", "BinaryOp7580", "BinaryOp7581", "/Gather_306_output_0", "/Div_61_output_0", "/Unsqueeze_649_output_0", "/Slice_83_output_0", "/Neg_41_output_0", "/Unsqueeze_648_output_0", "/Slice_82_output_0", "/Concat_264_output_0", "/Mul_163_output_0", "/Add_101_output_0", "/FakeLinear_82_output_0", "/Unsqueeze_644_output_0", "/Unsqueeze_645_output_0", "/Concat_262_output_0", "/Reshape_183_output_0", "/Reshape_188_output_0", "/FakeLinear_83_output_0", "/Add_103_output_0", "/post_attention_layernorm_20/Mul_1_output_0", "/mlp/gate_proj_20/FakeLinear_output_0", "/mlp/act_fn_20/Mul_output_0", "/mlp/up_proj_20/FakeLinear_output_0", "/mlp_20/Mul_output_0", "/mlp/down_proj_20/FakeLinear_output_0", "/Add_104_output_0", "/Reshape_189_output_0", "/input_layernorm_21/Mul_1_output_0", "/FakeLinear_84_output_0", "/Shape_294_output_0", "Shape7900", "BinaryOp7903", "BinaryOp7904", "Unsqueeze7905", "BinaryOp7907", "Unsqueeze7908", "StridedSlice7911", "BinaryOp7913", "BinaryOp7914", "/Gather_318_output_0", "/Unsqueeze_672_output_0", "Unsqueeze7922", "Unsqueeze7925", "StridedSlice7928", "Squeeze7929", "BinaryOp7930", "BinaryOp7931", "/Gather_319_output_0", "/Unsqueeze_673_output_0", "/Concat_273_output_0", "/Reshape_190_output_0", "/Mul_168_output_0", "/Shape_296_output_0", "Shape8032", "BinaryOp8035", "BinaryOp8036", "Unsqueeze8037", "BinaryOp8039", "Unsqueeze8040", "StridedSlice8043", "Squeeze8044", "BinaryOp8045", "BinaryOp8046", "/Gather_320_output_0", "/Div_63_output_0", "/Unsqueeze_679_output_0", "/Slice_85_output_0", "/Neg_42_output_0", "/Unsqueeze_678_output_0", "/Slice_84_output_0", "/Concat_276_output_0", "/Mul_169_output_0", "/Add_105_output_0", "/FakeLinear_85_output_0", "/Unsqueeze_674_output_0", "/Unsqueeze_675_output_0", "/Concat_274_output_0", "/Reshape_191_output_0", "/Mul_170_output_0", "/Shape_297_output_0", "Shape7938", "BinaryOp7941", "BinaryOp7942", "Unsqueeze7943", "BinaryOp7945", "Unsqueeze7946", "StridedSlice7949", "Squeeze7950", "BinaryOp7951", "BinaryOp7952", "/Gather_321_output_0", "/Div_64_output_0", "/Unsqueeze_681_output_0", "/Slice_87_output_0", "/Neg_43_output_0", "/Unsqueeze_680_output_0", "/Slice_86_output_0", "/Concat_277_output_0", "/Mul_171_output_0", "/Add_106_output_0", "/FakeLinear_86_output_0", "/Unsqueeze_676_output_0", "/Unsqueeze_677_output_0", "/Concat_275_output_0", "/Reshape_192_output_0", "/Reshape_197_output_0", "/FakeLinear_87_output_0", "/Add_108_output_0", "/post_attention_layernorm_21/Mul_1_output_0", "/mlp/gate_proj_21/FakeLinear_output_0", "/mlp/act_fn_21/Mul_output_0", "/mlp/up_proj_21/FakeLinear_output_0", "/mlp_21/Mul_output_0", "/mlp/down_proj_21/FakeLinear_output_0", "/Add_109_output_0", "/Reshape_198_output_0", "/input_layernorm_22/Mul_1_output_0", "/FakeLinear_88_output_0", "/Shape_308_output_0", "Shape8271", "BinaryOp8274", "BinaryOp8275", "Unsqueeze8276", "BinaryOp8278", "Unsqueeze8279", "StridedSlice8282", "BinaryOp8284", "BinaryOp8285", "/Gather_333_output_0", "/Unsqueeze_704_output_0", "Unsqueeze8293", "Unsqueeze8296", "StridedSlice8299", "Squeeze8300", "BinaryOp8301", "BinaryOp8302", "/Gather_334_output_0", "/Unsqueeze_705_output_0", "/Concat_286_output_0", "/Reshape_199_output_0", "/Mul_176_output_0", "/Shape_310_output_0", "Shape8403", "BinaryOp8406", "BinaryOp8407", "Unsqueeze8408", "BinaryOp8410", "Unsqueeze8411", "StridedSlice8414", "Squeeze8415", "BinaryOp8416", "BinaryOp8417", "/Gather_335_output_0", "/Div_66_output_0", "/Unsqueeze_711_output_0", "/Slice_89_output_0", "/Neg_44_output_0", "/Unsqueeze_710_output_0", "/Slice_88_output_0", "/Concat_289_output_0", "/Mul_177_output_0", "/Add_110_output_0", "/FakeLinear_89_output_0", "/Unsqueeze_706_output_0", "/Unsqueeze_707_output_0", "/Concat_287_output_0", "/Reshape_200_output_0", "/Mul_178_output_0", "/Shape_311_output_0", "Shape8309", "BinaryOp8312", "BinaryOp8313", "Unsqueeze8314", "BinaryOp8316", "Unsqueeze8317", "StridedSlice8320", "Squeeze8321", "BinaryOp8322", "BinaryOp8323", "/Gather_336_output_0", "/Div_67_output_0", "/Unsqueeze_713_output_0", "/Slice_91_output_0", "/Neg_45_output_0", "/Unsqueeze_712_output_0", "/Slice_90_output_0", "/Concat_290_output_0", "/Mul_179_output_0", "/Add_111_output_0", "/FakeLinear_90_output_0", "/Unsqueeze_708_output_0", "/Unsqueeze_709_output_0", "/Concat_288_output_0", "/Reshape_201_output_0", "/Reshape_206_output_0", "/FakeLinear_91_output_0", "/Add_113_output_0", "/post_attention_layernorm_22/Mul_1_output_0", "/mlp/gate_proj_22/FakeLinear_output_0", "/mlp/act_fn_22/Mul_output_0", "/mlp/up_proj_22/FakeLinear_output_0", "/mlp_22/Mul_output_0", "/mlp/down_proj_22/FakeLinear_output_0", "/Add_114_output_0", "/Reshape_207_output_0", "/input_layernorm_23/Mul_1_output_0", "/FakeLinear_92_output_0", "/Shape_322_output_0", "Shape8642", "BinaryOp8645", "BinaryOp8646", "Unsqueeze8647", "BinaryOp8649", "Unsqueeze8650", "StridedSlice8653", "BinaryOp8655", "BinaryOp8656", "/Gather_348_output_0", "/Unsqueeze_736_output_0", "Unsqueeze8664", "Unsqueeze8667", "StridedSlice8670", "Squeeze8671", "BinaryOp8672", "BinaryOp8673", "/Gather_349_output_0", "/Unsqueeze_737_output_0", "/Concat_299_output_0", "/Reshape_208_output_0", "/Mul_184_output_0", "/Shape_324_output_0", "Shape8742", "BinaryOp8745", "BinaryOp8746", "Unsqueeze8747", "BinaryOp8749", "Unsqueeze8750", "StridedSlice8753", "Squeeze8754", "BinaryOp8755", "BinaryOp8756", "/Gather_350_output_0", "/Div_69_output_0", "/Unsqueeze_743_output_0", "/Slice_93_output_0", "/Neg_46_output_0", "/Unsqueeze_742_output_0", "/Slice_92_output_0", "/Concat_302_output_0", "/Mul_185_output_0", "/Add_115_output_0", "/FakeLinear_93_output_0", "/Unsqueeze_738_output_0", "/Unsqueeze_739_output_0", "/Concat_300_output_0", "/Reshape_209_output_0", "/Mul_186_output_0", "/Shape_325_output_0", "Shape8680", "BinaryOp8683", "BinaryOp8684", "Unsqueeze8685", "BinaryOp8687", "Unsqueeze8688", "StridedSlice8691", "Squeeze8692", "BinaryOp8693", "BinaryOp8694", "/Gather_351_output_0", "/Div_70_output_0", "/Unsqueeze_745_output_0", "/Slice_95_output_0", "/Neg_47_output_0", "/Unsqueeze_744_output_0", "/Slice_94_output_0", "/Concat_303_output_0", "/Mul_187_output_0", "/Add_116_output_0", "/FakeLinear_94_output_0", "/Unsqueeze_740_output_0", "/Unsqueeze_741_output_0", "/Concat_301_output_0", "/Reshape_210_output_0", "/Reshape_215_output_0", "/FakeLinear_95_output_0", "/Add_118_output_0", "/post_attention_layernorm_23/Mul_1_output_0", "/mlp/gate_proj_23/FakeLinear_output_0", "/mlp/act_fn_23/Mul_output_0", "/mlp/up_proj_23/FakeLinear_output_0", "/mlp_23/Mul_output_0", "/mlp/down_proj_23/FakeLinear_output_0", "/Add_119_output_0", "logits_index", "/lm/Slice_output_0", "/lm/norm/Mul_1_output_0", "logits", "/layers.0/self_attn/q_proj/Linear/pre_reshape", "/layers.0/self_attn/q_proj/Linear/pre_convert", "/layers.0/self_attn/q_proj/Linear", "/layers.0/self_attn/q_proj/Linear/post_convert", "/layers.0/self_attn/k_proj/Linear/pre_reshape", "/layers.0/self_attn/k_proj/Linear/pre_convert", "/layers.0/self_attn/k_proj/Linear", "/layers.0/self_attn/k_proj/Linear/post_convert", "/layers.0/self_attn/v_proj/Linear/pre_reshape", "/layers.0/self_attn/v_proj/Linear/pre_convert", "/layers.0/self_attn/v_proj/Linear", "/layers.0/self_attn/v_proj/Linear/post_convert", "/layers.0/self_attn/o_proj/Linear/pre_reshape", "/layers.0/self_attn/o_proj/Linear/pre_convert", "/layers.0/self_attn/o_proj/Linear", "/layers.0/self_attn/o_proj/Linear/post_convert", "/layers.0/mlp/gate_proj/Linear/pre_reshape", "/layers.0/mlp/gate_proj/Linear/pre_convert", "/layers.0/mlp/gate_proj/Linear", "/layers.0/mlp/gate_proj/Linear/post_convert", "/layers.0/mlp/up_proj/Linear/pre_reshape", "/layers.0/mlp/up_proj/Linear/pre_convert", "/layers.0/mlp/up_proj/Linear", "/layers.0/mlp/up_proj/Linear/post_convert", "/layers.0/mlp/down_proj/Linear/pre_reshape", "/layers.0/mlp/down_proj/Linear/pre_convert", "/layers.0/mlp/down_proj/Linear", "/layers.0/mlp/down_proj/Linear/post_convert", "/layers.1/self_attn/q_proj/Linear/pre_reshape", "/layers.1/self_attn/q_proj/Linear/pre_convert", "/layers.1/self_attn/q_proj/Linear", "/layers.1/self_attn/q_proj/Linear/post_convert", "/layers.1/self_attn/k_proj/Linear/pre_reshape", "/layers.1/self_attn/k_proj/Linear/pre_convert", "/layers.1/self_attn/k_proj/Linear", "/layers.1/self_attn/k_proj/Linear/post_convert", "/layers.1/self_attn/v_proj/Linear/pre_reshape", "/layers.1/self_attn/v_proj/Linear/pre_convert", "/layers.1/self_attn/v_proj/Linear", "/layers.1/self_attn/v_proj/Linear/post_convert", "/layers.1/self_attn/o_proj/Linear/pre_reshape", "/layers.1/self_attn/o_proj/Linear/pre_convert", "/layers.1/self_attn/o_proj/Linear", "/layers.1/self_attn/o_proj/Linear/post_convert", "/layers.1/mlp/gate_proj/Linear/pre_reshape", "/layers.1/mlp/gate_proj/Linear/pre_convert", "/layers.1/mlp/gate_proj/Linear", "/layers.1/mlp/gate_proj/Linear/post_convert", "/layers.1/mlp/up_proj/Linear/pre_reshape", "/layers.1/mlp/up_proj/Linear/pre_convert", "/layers.1/mlp/up_proj/Linear", "/layers.1/mlp/up_proj/Linear/post_convert", "/layers.1/mlp/down_proj/Linear/pre_reshape", "/layers.1/mlp/down_proj/Linear/pre_convert", "/layers.1/mlp/down_proj/Linear", "/layers.1/mlp/down_proj/Linear/post_convert", "/layers.2/self_attn/q_proj/Linear/pre_reshape", "/layers.2/self_attn/q_proj/Linear/pre_convert", "/layers.2/self_attn/q_proj/Linear", "/layers.2/self_attn/q_proj/Linear/post_convert", "/layers.2/self_attn/k_proj/Linear/pre_reshape", "/layers.2/self_attn/k_proj/Linear/pre_convert", "/layers.2/self_attn/k_proj/Linear", "/layers.2/self_attn/k_proj/Linear/post_convert", "/layers.2/self_attn/v_proj/Linear/pre_reshape", "/layers.2/self_attn/v_proj/Linear/pre_convert", "/layers.2/self_attn/v_proj/Linear", "/layers.2/self_attn/v_proj/Linear/post_convert", "/layers.2/self_attn/o_proj/Linear/pre_reshape", "/layers.2/self_attn/o_proj/Linear/pre_convert", "/layers.2/self_attn/o_proj/Linear", "/layers.2/self_attn/o_proj/Linear/post_convert", "/layers.2/mlp/gate_proj/Linear/pre_reshape", "/layers.2/mlp/gate_proj/Linear/pre_convert", "/layers.2/mlp/gate_proj/Linear", "/layers.2/mlp/gate_proj/Linear/post_convert", "/layers.2/mlp/up_proj/Linear/pre_reshape", "/layers.2/mlp/up_proj/Linear/pre_convert", "/layers.2/mlp/up_proj/Linear", "/layers.2/mlp/up_proj/Linear/post_convert", "/layers.2/mlp/down_proj/Linear/pre_reshape", "/layers.2/mlp/down_proj/Linear/pre_convert", "/layers.2/mlp/down_proj/Linear", "/layers.2/mlp/down_proj/Linear/post_convert", "/layers.3/self_attn/q_proj/Linear/pre_reshape", "/layers.3/self_attn/q_proj/Linear/pre_convert", "/layers.3/self_attn/q_proj/Linear", "/layers.3/self_attn/q_proj/Linear/post_convert", "/layers.3/self_attn/k_proj/Linear/pre_reshape", "/layers.3/self_attn/k_proj/Linear/pre_convert", "/layers.3/self_attn/k_proj/Linear", "/layers.3/self_attn/k_proj/Linear/post_convert", "/layers.3/self_attn/v_proj/Linear/pre_reshape", "/layers.3/self_attn/v_proj/Linear/pre_convert", "/layers.3/self_attn/v_proj/Linear", "/layers.3/self_attn/v_proj/Linear/post_convert", "/layers.3/self_attn/o_proj/Linear/pre_reshape", "/layers.3/self_attn/o_proj/Linear/pre_convert", "/layers.3/self_attn/o_proj/Linear", "/layers.3/self_attn/o_proj/Linear/post_convert", "/layers.3/mlp/gate_proj/Linear/pre_reshape", "/layers.3/mlp/gate_proj/Linear/pre_convert", "/layers.3/mlp/gate_proj/Linear", "/layers.3/mlp/gate_proj/Linear/post_convert", "/layers.3/mlp/up_proj/Linear/pre_reshape", "/layers.3/mlp/up_proj/Linear/pre_convert", "/layers.3/mlp/up_proj/Linear", "/layers.3/mlp/up_proj/Linear/post_convert", "/layers.3/mlp/down_proj/Linear/pre_reshape", "/layers.3/mlp/down_proj/Linear/pre_convert", "/layers.3/mlp/down_proj/Linear", "/layers.3/mlp/down_proj/Linear/post_convert", "/layers.4/self_attn/q_proj/Linear/pre_reshape", "/layers.4/self_attn/q_proj/Linear/pre_convert", "/layers.4/self_attn/q_proj/Linear", "/layers.4/self_attn/q_proj/Linear/post_convert", "/layers.4/self_attn/k_proj/Linear/pre_reshape", "/layers.4/self_attn/k_proj/Linear/pre_convert", "/layers.4/self_attn/k_proj/Linear", "/layers.4/self_attn/k_proj/Linear/post_convert", "/layers.4/self_attn/v_proj/Linear/pre_reshape", "/layers.4/self_attn/v_proj/Linear/pre_convert", "/layers.4/self_attn/v_proj/Linear", "/layers.4/self_attn/v_proj/Linear/post_convert", "/layers.4/self_attn/o_proj/Linear/pre_reshape", "/layers.4/self_attn/o_proj/Linear/pre_convert", "/layers.4/self_attn/o_proj/Linear", "/layers.4/self_attn/o_proj/Linear/post_convert", "/layers.4/mlp/gate_proj/Linear/pre_reshape", "/layers.4/mlp/gate_proj/Linear/pre_convert", "/layers.4/mlp/gate_proj/Linear", "/layers.4/mlp/gate_proj/Linear/post_convert", "/layers.4/mlp/up_proj/Linear/pre_reshape", "/layers.4/mlp/up_proj/Linear/pre_convert", "/layers.4/mlp/up_proj/Linear", "/layers.4/mlp/up_proj/Linear/post_convert", "/layers.4/mlp/down_proj/Linear/pre_reshape", "/layers.4/mlp/down_proj/Linear/pre_convert", "/layers.4/mlp/down_proj/Linear", "/layers.4/mlp/down_proj/Linear/post_convert", "/layers.5/self_attn/q_proj/Linear/pre_reshape", "/layers.5/self_attn/q_proj/Linear/pre_convert", "/layers.5/self_attn/q_proj/Linear", "/layers.5/self_attn/q_proj/Linear/post_convert", "/layers.5/self_attn/k_proj/Linear/pre_reshape", "/layers.5/self_attn/k_proj/Linear/pre_convert", "/layers.5/self_attn/k_proj/Linear", "/layers.5/self_attn/k_proj/Linear/post_convert", "/layers.5/self_attn/v_proj/Linear/pre_reshape", "/layers.5/self_attn/v_proj/Linear/pre_convert", "/layers.5/self_attn/v_proj/Linear", "/layers.5/self_attn/v_proj/Linear/post_convert", "/layers.5/self_attn/o_proj/Linear/pre_reshape", "/layers.5/self_attn/o_proj/Linear/pre_convert", "/layers.5/self_attn/o_proj/Linear", "/layers.5/self_attn/o_proj/Linear/post_convert", "/layers.5/mlp/gate_proj/Linear/pre_reshape", "/layers.5/mlp/gate_proj/Linear/pre_convert", "/layers.5/mlp/gate_proj/Linear", "/layers.5/mlp/gate_proj/Linear/post_convert", "/layers.5/mlp/up_proj/Linear/pre_reshape", "/layers.5/mlp/up_proj/Linear/pre_convert", "/layers.5/mlp/up_proj/Linear", "/layers.5/mlp/up_proj/Linear/post_convert", "/layers.5/mlp/down_proj/Linear/pre_reshape", "/layers.5/mlp/down_proj/Linear/pre_convert", "/layers.5/mlp/down_proj/Linear", "/layers.5/mlp/down_proj/Linear/post_convert", "/layers.6/self_attn/q_proj/Linear/pre_reshape", "/layers.6/self_attn/q_proj/Linear/pre_convert", "/layers.6/self_attn/q_proj/Linear", "/layers.6/self_attn/q_proj/Linear/post_convert", "/layers.6/self_attn/k_proj/Linear/pre_reshape", "/layers.6/self_attn/k_proj/Linear/pre_convert", "/layers.6/self_attn/k_proj/Linear", "/layers.6/self_attn/k_proj/Linear/post_convert", "/layers.6/self_attn/v_proj/Linear/pre_reshape", "/layers.6/self_attn/v_proj/Linear/pre_convert", "/layers.6/self_attn/v_proj/Linear", "/layers.6/self_attn/v_proj/Linear/post_convert", "/layers.6/self_attn/o_proj/Linear/pre_reshape", "/layers.6/self_attn/o_proj/Linear/pre_convert", "/layers.6/self_attn/o_proj/Linear", "/layers.6/self_attn/o_proj/Linear/post_convert", "/layers.6/mlp/gate_proj/Linear/pre_reshape", "/layers.6/mlp/gate_proj/Linear/pre_convert", "/layers.6/mlp/gate_proj/Linear", "/layers.6/mlp/gate_proj/Linear/post_convert", "/layers.6/mlp/up_proj/Linear/pre_reshape", "/layers.6/mlp/up_proj/Linear/pre_convert", "/layers.6/mlp/up_proj/Linear", "/layers.6/mlp/up_proj/Linear/post_convert", "/layers.6/mlp/down_proj/Linear/pre_reshape", "/layers.6/mlp/down_proj/Linear/pre_convert", "/layers.6/mlp/down_proj/Linear", "/layers.6/mlp/down_proj/Linear/post_convert", "/layers.7/self_attn/q_proj/Linear/pre_reshape", "/layers.7/self_attn/q_proj/Linear/pre_convert", "/layers.7/self_attn/q_proj/Linear", "/layers.7/self_attn/q_proj/Linear/post_convert", "/layers.7/self_attn/k_proj/Linear/pre_reshape", "/layers.7/self_attn/k_proj/Linear/pre_convert", "/layers.7/self_attn/k_proj/Linear", "/layers.7/self_attn/k_proj/Linear/post_convert", "/layers.7/self_attn/v_proj/Linear/pre_reshape", "/layers.7/self_attn/v_proj/Linear/pre_convert", "/layers.7/self_attn/v_proj/Linear", "/layers.7/self_attn/v_proj/Linear/post_convert", "/layers.7/self_attn/o_proj/Linear/pre_reshape", "/layers.7/self_attn/o_proj/Linear/pre_convert", "/layers.7/self_attn/o_proj/Linear", "/layers.7/self_attn/o_proj/Linear/post_convert", "/layers.7/mlp/gate_proj/Linear/pre_reshape", "/layers.7/mlp/gate_proj/Linear/pre_convert", "/layers.7/mlp/gate_proj/Linear", "/layers.7/mlp/gate_proj/Linear/post_convert", "/layers.7/mlp/up_proj/Linear/pre_reshape", "/layers.7/mlp/up_proj/Linear/pre_convert", "/layers.7/mlp/up_proj/Linear", "/layers.7/mlp/up_proj/Linear/post_convert", "/layers.7/mlp/down_proj/Linear/pre_reshape", "/layers.7/mlp/down_proj/Linear/pre_convert", "/layers.7/mlp/down_proj/Linear", "/layers.7/mlp/down_proj/Linear/post_convert", "/layers.8/self_attn/q_proj/Linear/pre_reshape", "/layers.8/self_attn/q_proj/Linear/pre_convert", "/layers.8/self_attn/q_proj/Linear", "/layers.8/self_attn/q_proj/Linear/post_convert", "/layers.8/self_attn/k_proj/Linear/pre_reshape", "/layers.8/self_attn/k_proj/Linear/pre_convert", "/layers.8/self_attn/k_proj/Linear", "/layers.8/self_attn/k_proj/Linear/post_convert", "/layers.8/self_attn/v_proj/Linear/pre_reshape", "/layers.8/self_attn/v_proj/Linear/pre_convert", "/layers.8/self_attn/v_proj/Linear", "/layers.8/self_attn/v_proj/Linear/post_convert", "/layers.8/self_attn/o_proj/Linear/pre_reshape", "/layers.8/self_attn/o_proj/Linear/pre_convert", "/layers.8/self_attn/o_proj/Linear", "/layers.8/self_attn/o_proj/Linear/post_convert", "/layers.8/mlp/gate_proj/Linear/pre_reshape", "/layers.8/mlp/gate_proj/Linear/pre_convert", "/layers.8/mlp/gate_proj/Linear", "/layers.8/mlp/gate_proj/Linear/post_convert", "/layers.8/mlp/up_proj/Linear/pre_reshape", "/layers.8/mlp/up_proj/Linear/pre_convert", "/layers.8/mlp/up_proj/Linear", "/layers.8/mlp/up_proj/Linear/post_convert", "/layers.8/mlp/down_proj/Linear/pre_reshape", "/layers.8/mlp/down_proj/Linear/pre_convert", "/layers.8/mlp/down_proj/Linear", "/layers.8/mlp/down_proj/Linear/post_convert", "/layers.9/self_attn/q_proj/Linear/pre_reshape", "/layers.9/self_attn/q_proj/Linear/pre_convert", "/layers.9/self_attn/q_proj/Linear", "/layers.9/self_attn/q_proj/Linear/post_convert", "/layers.9/self_attn/k_proj/Linear/pre_reshape", "/layers.9/self_attn/k_proj/Linear/pre_convert", "/layers.9/self_attn/k_proj/Linear", "/layers.9/self_attn/k_proj/Linear/post_convert", "/layers.9/self_attn/v_proj/Linear/pre_reshape", "/layers.9/self_attn/v_proj/Linear/pre_convert", "/layers.9/self_attn/v_proj/Linear", "/layers.9/self_attn/v_proj/Linear/post_convert", "/layers.9/self_attn/o_proj/Linear/pre_reshape", "/layers.9/self_attn/o_proj/Linear/pre_convert", "/layers.9/self_attn/o_proj/Linear", "/layers.9/self_attn/o_proj/Linear/post_convert", "/layers.9/mlp/gate_proj/Linear/pre_reshape", "/layers.9/mlp/gate_proj/Linear/pre_convert", "/layers.9/mlp/gate_proj/Linear", "/layers.9/mlp/gate_proj/Linear/post_convert", "/layers.9/mlp/up_proj/Linear/pre_reshape", "/layers.9/mlp/up_proj/Linear/pre_convert", "/layers.9/mlp/up_proj/Linear", "/layers.9/mlp/up_proj/Linear/post_convert", "/layers.9/mlp/down_proj/Linear/pre_reshape", "/layers.9/mlp/down_proj/Linear/pre_convert", "/layers.9/mlp/down_proj/Linear", "/layers.9/mlp/down_proj/Linear/post_convert", "/layers.10/self_attn/q_proj/Linear/pre_reshape", "/layers.10/self_attn/q_proj/Linear/pre_convert", "/layers.10/self_attn/q_proj/Linear", "/layers.10/self_attn/q_proj/Linear/post_convert", "/layers.10/self_attn/k_proj/Linear/pre_reshape", "/layers.10/self_attn/k_proj/Linear/pre_convert", "/layers.10/self_attn/k_proj/Linear", "/layers.10/self_attn/k_proj/Linear/post_convert", "/layers.10/self_attn/v_proj/Linear/pre_reshape", "/layers.10/self_attn/v_proj/Linear/pre_convert", "/layers.10/self_attn/v_proj/Linear", "/layers.10/self_attn/v_proj/Linear/post_convert", "/layers.10/self_attn/o_proj/Linear/pre_reshape", "/layers.10/self_attn/o_proj/Linear/pre_convert", "/layers.10/self_attn/o_proj/Linear", "/layers.10/self_attn/o_proj/Linear/post_convert", "/layers.10/mlp/gate_proj/Linear/pre_reshape", "/layers.10/mlp/gate_proj/Linear/pre_convert", "/layers.10/mlp/gate_proj/Linear", "/layers.10/mlp/gate_proj/Linear/post_convert", "/layers.10/mlp/up_proj/Linear/pre_reshape", "/layers.10/mlp/up_proj/Linear/pre_convert", "/layers.10/mlp/up_proj/Linear", "/layers.10/mlp/up_proj/Linear/post_convert", "/layers.10/mlp/down_proj/Linear/pre_reshape", "/layers.10/mlp/down_proj/Linear/pre_convert", "/layers.10/mlp/down_proj/Linear", "/layers.10/mlp/down_proj/Linear/post_convert", "/layers.11/self_attn/q_proj/Linear/pre_reshape", "/layers.11/self_attn/q_proj/Linear/pre_convert", "/layers.11/self_attn/q_proj/Linear", "/layers.11/self_attn/q_proj/Linear/post_convert", "/layers.11/self_attn/k_proj/Linear/pre_reshape", "/layers.11/self_attn/k_proj/Linear/pre_convert", "/layers.11/self_attn/k_proj/Linear", "/layers.11/self_attn/k_proj/Linear/post_convert", "/layers.11/self_attn/v_proj/Linear/pre_reshape", "/layers.11/self_attn/v_proj/Linear/pre_convert", "/layers.11/self_attn/v_proj/Linear", "/layers.11/self_attn/v_proj/Linear/post_convert", "/layers.11/self_attn/o_proj/Linear/pre_reshape", "/layers.11/self_attn/o_proj/Linear/pre_convert", "/layers.11/self_attn/o_proj/Linear", "/layers.11/self_attn/o_proj/Linear/post_convert", "/layers.11/mlp/gate_proj/Linear/pre_reshape", "/layers.11/mlp/gate_proj/Linear/pre_convert", "/layers.11/mlp/gate_proj/Linear", "/layers.11/mlp/gate_proj/Linear/post_convert", "/layers.11/mlp/up_proj/Linear/pre_reshape", "/layers.11/mlp/up_proj/Linear/pre_convert", "/layers.11/mlp/up_proj/Linear", "/layers.11/mlp/up_proj/Linear/post_convert", "/layers.11/mlp/down_proj/Linear/pre_reshape", "/layers.11/mlp/down_proj/Linear/pre_convert", "/layers.11/mlp/down_proj/Linear", "/layers.11/mlp/down_proj/Linear/post_convert", "/layers.12/self_attn/q_proj/Linear/pre_reshape", "/layers.12/self_attn/q_proj/Linear/pre_convert", "/layers.12/self_attn/q_proj/Linear", "/layers.12/self_attn/q_proj/Linear/post_convert", "/layers.12/self_attn/k_proj/Linear/pre_reshape", "/layers.12/self_attn/k_proj/Linear/pre_convert", "/layers.12/self_attn/k_proj/Linear", "/layers.12/self_attn/k_proj/Linear/post_convert", "/layers.12/self_attn/v_proj/Linear/pre_reshape", "/layers.12/self_attn/v_proj/Linear/pre_convert", "/layers.12/self_attn/v_proj/Linear", "/layers.12/self_attn/v_proj/Linear/post_convert", "/layers.12/self_attn/o_proj/Linear/pre_reshape", "/layers.12/self_attn/o_proj/Linear/pre_convert", "/layers.12/self_attn/o_proj/Linear", "/layers.12/self_attn/o_proj/Linear/post_convert", "/layers.12/mlp/gate_proj/Linear/pre_reshape", "/layers.12/mlp/gate_proj/Linear/pre_convert", "/layers.12/mlp/gate_proj/Linear", "/layers.12/mlp/gate_proj/Linear/post_convert", "/layers.12/mlp/up_proj/Linear/pre_reshape", "/layers.12/mlp/up_proj/Linear/pre_convert", "/layers.12/mlp/up_proj/Linear", "/layers.12/mlp/up_proj/Linear/post_convert", "/layers.12/mlp/down_proj/Linear/pre_reshape", "/layers.12/mlp/down_proj/Linear/pre_convert", "/layers.12/mlp/down_proj/Linear", "/layers.12/mlp/down_proj/Linear/post_convert", "/layers.13/self_attn/q_proj/Linear/pre_reshape", "/layers.13/self_attn/q_proj/Linear/pre_convert", "/layers.13/self_attn/q_proj/Linear", "/layers.13/self_attn/q_proj/Linear/post_convert", "/layers.13/self_attn/k_proj/Linear/pre_reshape", "/layers.13/self_attn/k_proj/Linear/pre_convert", "/layers.13/self_attn/k_proj/Linear", "/layers.13/self_attn/k_proj/Linear/post_convert", "/layers.13/self_attn/v_proj/Linear/pre_reshape", "/layers.13/self_attn/v_proj/Linear/pre_convert", "/layers.13/self_attn/v_proj/Linear", "/layers.13/self_attn/v_proj/Linear/post_convert", "/layers.13/self_attn/o_proj/Linear/pre_reshape", "/layers.13/self_attn/o_proj/Linear/pre_convert", "/layers.13/self_attn/o_proj/Linear", "/layers.13/self_attn/o_proj/Linear/post_convert", "/layers.13/mlp/gate_proj/Linear/pre_reshape", "/layers.13/mlp/gate_proj/Linear/pre_convert", "/layers.13/mlp/gate_proj/Linear", "/layers.13/mlp/gate_proj/Linear/post_convert", "/layers.13/mlp/up_proj/Linear/pre_reshape", "/layers.13/mlp/up_proj/Linear/pre_convert", "/layers.13/mlp/up_proj/Linear", "/layers.13/mlp/up_proj/Linear/post_convert", "/layers.13/mlp/down_proj/Linear/pre_reshape", "/layers.13/mlp/down_proj/Linear/pre_convert", "/layers.13/mlp/down_proj/Linear", "/layers.13/mlp/down_proj/Linear/post_convert", "/layers.14/self_attn/q_proj/Linear/pre_reshape", "/layers.14/self_attn/q_proj/Linear/pre_convert", "/layers.14/self_attn/q_proj/Linear", "/layers.14/self_attn/q_proj/Linear/post_convert", "/layers.14/self_attn/k_proj/Linear/pre_reshape", "/layers.14/self_attn/k_proj/Linear/pre_convert", "/layers.14/self_attn/k_proj/Linear", "/layers.14/self_attn/k_proj/Linear/post_convert", "/layers.14/self_attn/v_proj/Linear/pre_reshape", "/layers.14/self_attn/v_proj/Linear/pre_convert", "/layers.14/self_attn/v_proj/Linear", "/layers.14/self_attn/v_proj/Linear/post_convert", "/layers.14/self_attn/o_proj/Linear/pre_reshape", "/layers.14/self_attn/o_proj/Linear/pre_convert", "/layers.14/self_attn/o_proj/Linear", "/layers.14/self_attn/o_proj/Linear/post_convert", "/layers.14/mlp/gate_proj/Linear/pre_reshape", "/layers.14/mlp/gate_proj/Linear/pre_convert", "/layers.14/mlp/gate_proj/Linear", "/layers.14/mlp/gate_proj/Linear/post_convert", "/layers.14/mlp/up_proj/Linear/pre_reshape", "/layers.14/mlp/up_proj/Linear/pre_convert", "/layers.14/mlp/up_proj/Linear", "/layers.14/mlp/up_proj/Linear/post_convert", "/layers.14/mlp/down_proj/Linear/pre_reshape", "/layers.14/mlp/down_proj/Linear/pre_convert", "/layers.14/mlp/down_proj/Linear", "/layers.14/mlp/down_proj/Linear/post_convert", "/layers.15/self_attn/q_proj/Linear/pre_reshape", "/layers.15/self_attn/q_proj/Linear/pre_convert", "/layers.15/self_attn/q_proj/Linear", "/layers.15/self_attn/q_proj/Linear/post_convert", "/layers.15/self_attn/k_proj/Linear/pre_reshape", "/layers.15/self_attn/k_proj/Linear/pre_convert", "/layers.15/self_attn/k_proj/Linear", "/layers.15/self_attn/k_proj/Linear/post_convert", "/layers.15/self_attn/v_proj/Linear/pre_reshape", "/layers.15/self_attn/v_proj/Linear/pre_convert", "/layers.15/self_attn/v_proj/Linear", "/layers.15/self_attn/v_proj/Linear/post_convert", "/layers.15/self_attn/o_proj/Linear/pre_reshape", "/layers.15/self_attn/o_proj/Linear/pre_convert", "/layers.15/self_attn/o_proj/Linear", "/layers.15/self_attn/o_proj/Linear/post_convert", "/layers.15/mlp/gate_proj/Linear/pre_reshape", "/layers.15/mlp/gate_proj/Linear/pre_convert", "/layers.15/mlp/gate_proj/Linear", "/layers.15/mlp/gate_proj/Linear/post_convert", "/layers.15/mlp/up_proj/Linear/pre_reshape", "/layers.15/mlp/up_proj/Linear/pre_convert", "/layers.15/mlp/up_proj/Linear", "/layers.15/mlp/up_proj/Linear/post_convert", "/layers.15/mlp/down_proj/Linear/pre_reshape", "/layers.15/mlp/down_proj/Linear/pre_convert", "/layers.15/mlp/down_proj/Linear", "/layers.15/mlp/down_proj/Linear/post_convert", "/layers.16/self_attn/q_proj/Linear/pre_reshape", "/layers.16/self_attn/q_proj/Linear/pre_convert", "/layers.16/self_attn/q_proj/Linear", "/layers.16/self_attn/q_proj/Linear/post_convert", "/layers.16/self_attn/k_proj/Linear/pre_reshape", "/layers.16/self_attn/k_proj/Linear/pre_convert", "/layers.16/self_attn/k_proj/Linear", "/layers.16/self_attn/k_proj/Linear/post_convert", "/layers.16/self_attn/v_proj/Linear/pre_reshape", "/layers.16/self_attn/v_proj/Linear/pre_convert", "/layers.16/self_attn/v_proj/Linear", "/layers.16/self_attn/v_proj/Linear/post_convert", "/layers.16/self_attn/o_proj/Linear/pre_reshape", "/layers.16/self_attn/o_proj/Linear/pre_convert", "/layers.16/self_attn/o_proj/Linear", "/layers.16/self_attn/o_proj/Linear/post_convert", "/layers.16/mlp/gate_proj/Linear/pre_reshape", "/layers.16/mlp/gate_proj/Linear/pre_convert", "/layers.16/mlp/gate_proj/Linear", "/layers.16/mlp/gate_proj/Linear/post_convert", "/layers.16/mlp/up_proj/Linear/pre_reshape", "/layers.16/mlp/up_proj/Linear/pre_convert", "/layers.16/mlp/up_proj/Linear", "/layers.16/mlp/up_proj/Linear/post_convert", "/layers.16/mlp/down_proj/Linear/pre_reshape", "/layers.16/mlp/down_proj/Linear/pre_convert", "/layers.16/mlp/down_proj/Linear", "/layers.16/mlp/down_proj/Linear/post_convert", "/layers.17/self_attn/q_proj/Linear/pre_reshape", "/layers.17/self_attn/q_proj/Linear/pre_convert", "/layers.17/self_attn/q_proj/Linear", "/layers.17/self_attn/q_proj/Linear/post_convert", "/layers.17/self_attn/k_proj/Linear/pre_reshape", "/layers.17/self_attn/k_proj/Linear/pre_convert", "/layers.17/self_attn/k_proj/Linear", "/layers.17/self_attn/k_proj/Linear/post_convert", "/layers.17/self_attn/v_proj/Linear/pre_reshape", "/layers.17/self_attn/v_proj/Linear/pre_convert", "/layers.17/self_attn/v_proj/Linear", "/layers.17/self_attn/v_proj/Linear/post_convert", "/layers.17/self_attn/o_proj/Linear/pre_reshape", "/layers.17/self_attn/o_proj/Linear/pre_convert", "/layers.17/self_attn/o_proj/Linear", "/layers.17/self_attn/o_proj/Linear/post_convert", "/layers.17/mlp/gate_proj/Linear/pre_reshape", "/layers.17/mlp/gate_proj/Linear/pre_convert", "/layers.17/mlp/gate_proj/Linear", "/layers.17/mlp/gate_proj/Linear/post_convert", "/layers.17/mlp/up_proj/Linear/pre_reshape", "/layers.17/mlp/up_proj/Linear/pre_convert", "/layers.17/mlp/up_proj/Linear", "/layers.17/mlp/up_proj/Linear/post_convert", "/layers.17/mlp/down_proj/Linear/pre_reshape", "/layers.17/mlp/down_proj/Linear/pre_convert", "/layers.17/mlp/down_proj/Linear", "/layers.17/mlp/down_proj/Linear/post_convert", "/layers.18/self_attn/q_proj/Linear/pre_reshape", "/layers.18/self_attn/q_proj/Linear/pre_convert", "/layers.18/self_attn/q_proj/Linear", "/layers.18/self_attn/q_proj/Linear/post_convert", "/layers.18/self_attn/k_proj/Linear/pre_reshape", "/layers.18/self_attn/k_proj/Linear/pre_convert", "/layers.18/self_attn/k_proj/Linear", "/layers.18/self_attn/k_proj/Linear/post_convert", "/layers.18/self_attn/v_proj/Linear/pre_reshape", "/layers.18/self_attn/v_proj/Linear/pre_convert", "/layers.18/self_attn/v_proj/Linear", "/layers.18/self_attn/v_proj/Linear/post_convert", "/layers.18/self_attn/o_proj/Linear/pre_reshape", "/layers.18/self_attn/o_proj/Linear/pre_convert", "/layers.18/self_attn/o_proj/Linear", "/layers.18/self_attn/o_proj/Linear/post_convert", "/layers.18/mlp/gate_proj/Linear/pre_reshape", "/layers.18/mlp/gate_proj/Linear/pre_convert", "/layers.18/mlp/gate_proj/Linear", "/layers.18/mlp/gate_proj/Linear/post_convert", "/layers.18/mlp/up_proj/Linear/pre_reshape", "/layers.18/mlp/up_proj/Linear/pre_convert", "/layers.18/mlp/up_proj/Linear", "/layers.18/mlp/up_proj/Linear/post_convert", "/layers.18/mlp/down_proj/Linear/pre_reshape", "/layers.18/mlp/down_proj/Linear/pre_convert", "/layers.18/mlp/down_proj/Linear", "/layers.18/mlp/down_proj/Linear/post_convert", "/layers.19/self_attn/q_proj/Linear/pre_reshape", "/layers.19/self_attn/q_proj/Linear/pre_convert", "/layers.19/self_attn/q_proj/Linear", "/layers.19/self_attn/q_proj/Linear/post_convert", "/layers.19/self_attn/k_proj/Linear/pre_reshape", "/layers.19/self_attn/k_proj/Linear/pre_convert", "/layers.19/self_attn/k_proj/Linear", "/layers.19/self_attn/k_proj/Linear/post_convert", "/layers.19/self_attn/v_proj/Linear/pre_reshape", "/layers.19/self_attn/v_proj/Linear/pre_convert", "/layers.19/self_attn/v_proj/Linear", "/layers.19/self_attn/v_proj/Linear/post_convert", "/layers.19/self_attn/o_proj/Linear/pre_reshape", "/layers.19/self_attn/o_proj/Linear/pre_convert", "/layers.19/self_attn/o_proj/Linear", "/layers.19/self_attn/o_proj/Linear/post_convert", "/layers.19/mlp/gate_proj/Linear/pre_reshape", "/layers.19/mlp/gate_proj/Linear/pre_convert", "/layers.19/mlp/gate_proj/Linear", "/layers.19/mlp/gate_proj/Linear/post_convert", "/layers.19/mlp/up_proj/Linear/pre_reshape", "/layers.19/mlp/up_proj/Linear/pre_convert", "/layers.19/mlp/up_proj/Linear", "/layers.19/mlp/up_proj/Linear/post_convert", "/layers.19/mlp/down_proj/Linear/pre_reshape", "/layers.19/mlp/down_proj/Linear/pre_convert", "/layers.19/mlp/down_proj/Linear", "/layers.19/mlp/down_proj/Linear/post_convert", "/layers.20/self_attn/q_proj/Linear/pre_reshape", "/layers.20/self_attn/q_proj/Linear/pre_convert", "/layers.20/self_attn/q_proj/Linear", "/layers.20/self_attn/q_proj/Linear/post_convert", "/layers.20/self_attn/k_proj/Linear/pre_reshape", "/layers.20/self_attn/k_proj/Linear/pre_convert", "/layers.20/self_attn/k_proj/Linear", "/layers.20/self_attn/k_proj/Linear/post_convert", "/layers.20/self_attn/v_proj/Linear/pre_reshape", "/layers.20/self_attn/v_proj/Linear/pre_convert", "/layers.20/self_attn/v_proj/Linear", "/layers.20/self_attn/v_proj/Linear/post_convert", "/layers.20/self_attn/o_proj/Linear/pre_reshape", "/layers.20/self_attn/o_proj/Linear/pre_convert", "/layers.20/self_attn/o_proj/Linear", "/layers.20/self_attn/o_proj/Linear/post_convert", "/layers.20/mlp/gate_proj/Linear/pre_reshape", "/layers.20/mlp/gate_proj/Linear/pre_convert", "/layers.20/mlp/gate_proj/Linear", "/layers.20/mlp/gate_proj/Linear/post_convert", "/layers.20/mlp/up_proj/Linear/pre_reshape", "/layers.20/mlp/up_proj/Linear/pre_convert", "/layers.20/mlp/up_proj/Linear", "/layers.20/mlp/up_proj/Linear/post_convert", "/layers.20/mlp/down_proj/Linear/pre_reshape", "/layers.20/mlp/down_proj/Linear/pre_convert", "/layers.20/mlp/down_proj/Linear", "/layers.20/mlp/down_proj/Linear/post_convert", "/layers.21/self_attn/q_proj/Linear/pre_reshape", "/layers.21/self_attn/q_proj/Linear/pre_convert", "/layers.21/self_attn/q_proj/Linear", "/layers.21/self_attn/q_proj/Linear/post_convert", "/layers.21/self_attn/k_proj/Linear/pre_reshape", "/layers.21/self_attn/k_proj/Linear/pre_convert", "/layers.21/self_attn/k_proj/Linear", "/layers.21/self_attn/k_proj/Linear/post_convert", "/layers.21/self_attn/v_proj/Linear/pre_reshape", "/layers.21/self_attn/v_proj/Linear/pre_convert", "/layers.21/self_attn/v_proj/Linear", "/layers.21/self_attn/v_proj/Linear/post_convert", "/layers.21/self_attn/o_proj/Linear/pre_reshape", "/layers.21/self_attn/o_proj/Linear/pre_convert", "/layers.21/self_attn/o_proj/Linear", "/layers.21/self_attn/o_proj/Linear/post_convert", "/layers.21/mlp/gate_proj/Linear/pre_reshape", "/layers.21/mlp/gate_proj/Linear/pre_convert", "/layers.21/mlp/gate_proj/Linear", "/layers.21/mlp/gate_proj/Linear/post_convert", "/layers.21/mlp/up_proj/Linear/pre_reshape", "/layers.21/mlp/up_proj/Linear/pre_convert", "/layers.21/mlp/up_proj/Linear", "/layers.21/mlp/up_proj/Linear/post_convert", "/layers.21/mlp/down_proj/Linear/pre_reshape", "/layers.21/mlp/down_proj/Linear/pre_convert", "/layers.21/mlp/down_proj/Linear", "/layers.21/mlp/down_proj/Linear/post_convert", "/layers.22/self_attn/q_proj/Linear/pre_reshape", "/layers.22/self_attn/q_proj/Linear/pre_convert", "/layers.22/self_attn/q_proj/Linear", "/layers.22/self_attn/q_proj/Linear/post_convert", "/layers.22/self_attn/k_proj/Linear/pre_reshape", "/layers.22/self_attn/k_proj/Linear/pre_convert", "/layers.22/self_attn/k_proj/Linear", "/layers.22/self_attn/k_proj/Linear/post_convert", "/layers.22/self_attn/v_proj/Linear/pre_reshape", "/layers.22/self_attn/v_proj/Linear/pre_convert", "/layers.22/self_attn/v_proj/Linear", "/layers.22/self_attn/v_proj/Linear/post_convert", "/layers.22/self_attn/o_proj/Linear/pre_reshape", "/layers.22/self_attn/o_proj/Linear/pre_convert", "/layers.22/self_attn/o_proj/Linear", "/layers.22/self_attn/o_proj/Linear/post_convert", "/layers.22/mlp/gate_proj/Linear/pre_reshape", "/layers.22/mlp/gate_proj/Linear/pre_convert", "/layers.22/mlp/gate_proj/Linear", "/layers.22/mlp/gate_proj/Linear/post_convert", "/layers.22/mlp/up_proj/Linear/pre_reshape", "/layers.22/mlp/up_proj/Linear/pre_convert", "/layers.22/mlp/up_proj/Linear", "/layers.22/mlp/up_proj/Linear/post_convert", "/layers.22/mlp/down_proj/Linear/pre_reshape", "/layers.22/mlp/down_proj/Linear/pre_convert", "/layers.22/mlp/down_proj/Linear", "/layers.22/mlp/down_proj/Linear/post_convert", "/layers.23/self_attn/q_proj/Linear/pre_reshape", "/layers.23/self_attn/q_proj/Linear/pre_convert", "/layers.23/self_attn/q_proj/Linear", "/layers.23/self_attn/q_proj/Linear/post_convert", "/layers.23/self_attn/k_proj/Linear/pre_reshape", "/layers.23/self_attn/k_proj/Linear/pre_convert", "/layers.23/self_attn/k_proj/Linear", "/layers.23/self_attn/k_proj/Linear/post_convert", "/layers.23/self_attn/v_proj/Linear/pre_reshape", "/layers.23/self_attn/v_proj/Linear/pre_convert", "/layers.23/self_attn/v_proj/Linear", "/layers.23/self_attn/v_proj/Linear/post_convert", "/layers.23/self_attn/o_proj/Linear/pre_reshape", "/layers.23/self_attn/o_proj/Linear/pre_convert", "/layers.23/self_attn/o_proj/Linear", "/layers.23/self_attn/o_proj/Linear/post_convert", "/layers.23/mlp/gate_proj/Linear/pre_reshape", "/layers.23/mlp/gate_proj/Linear/pre_convert", "/layers.23/mlp/gate_proj/Linear", "/layers.23/mlp/gate_proj/Linear/post_convert", "/layers.23/mlp/up_proj/Linear/pre_reshape", "/layers.23/mlp/up_proj/Linear/pre_convert", "/layers.23/mlp/up_proj/Linear", "/layers.23/mlp/up_proj/Linear/post_convert", "/layers.23/mlp/down_proj/Linear/pre_reshape", "/layers.23/mlp/down_proj/Linear/pre_convert", "/layers.23/mlp/down_proj/Linear", "/layers.23/mlp/down_proj/Linear/post_convert", "/lm/lm_head/Linear/pre_reshape", "/lm/lm_head/Linear/pre_convert", "/lm/lm_head/Linear", "/lm/lm_head/Linear/post_convert" ] , "tensorNumber": 0, "usage": "INFERENCE", "mnn_uuid": "add4ef8e-e3b2-432a-9957-34e7387a98b1" }